1. Exploratory Data Analysis (EDA)

In [28]:
import pandas as pd
import numpy as np
import seaborn as sns
import matplotlib.pyplot as plt
from statsmodels.stats.outliers_influence import variance_inflation_factor
from sklearn.preprocessing import StandardScaler
from sklearn.decomposition import PCA
from sklearn.metrics import mean_squared_error 

1.1 Variables — 1.1.1 Numeric variables; 1.1.2 Categorical variables (including date variables)

1.2 Target Variable

In [3]:
# Load the Kaggle house-prices training data; the first CSV column (Id) becomes the index.
# NOTE(review): this is an absolute path on the author's machine - adjust it to run elsewhere.
TRAIN_CSV_PATH = "C:/Users/KIM/Desktop/자기개발/kaggle competition/house-prices-advanced-regression-techniques/train.csv"
df = pd.read_csv(TRAIN_CSV_PATH, index_col=0)
In [4]:
# Preview the raw training frame (pandas shows only the first/last rows and columns).
df
Out[4]:
MSSubClass MSZoning LotFrontage LotArea Street Alley LotShape LandContour Utilities LotConfig ... PoolArea PoolQC Fence MiscFeature MiscVal MoSold YrSold SaleType SaleCondition SalePrice
Id
1 60 RL 65.0 8450 Pave NaN Reg Lvl AllPub Inside ... 0 NaN NaN NaN 0 2 2008 WD Normal 208500
2 20 RL 80.0 9600 Pave NaN Reg Lvl AllPub FR2 ... 0 NaN NaN NaN 0 5 2007 WD Normal 181500
3 60 RL 68.0 11250 Pave NaN IR1 Lvl AllPub Inside ... 0 NaN NaN NaN 0 9 2008 WD Normal 223500
4 70 RL 60.0 9550 Pave NaN IR1 Lvl AllPub Corner ... 0 NaN NaN NaN 0 2 2006 WD Abnorml 140000
5 60 RL 84.0 14260 Pave NaN IR1 Lvl AllPub FR2 ... 0 NaN NaN NaN 0 12 2008 WD Normal 250000
... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ...
1456 60 RL 62.0 7917 Pave NaN Reg Lvl AllPub Inside ... 0 NaN NaN NaN 0 8 2007 WD Normal 175000
1457 20 RL 85.0 13175 Pave NaN Reg Lvl AllPub Inside ... 0 NaN MnPrv NaN 0 2 2010 WD Normal 210000
1458 70 RL 66.0 9042 Pave NaN Reg Lvl AllPub Inside ... 0 NaN GdPrv Shed 2500 5 2010 WD Normal 266500
1459 20 RL 68.0 9717 Pave NaN Reg Lvl AllPub Inside ... 0 NaN NaN NaN 0 4 2010 WD Normal 142125
1460 20 RL 75.0 9937 Pave NaN Reg Lvl AllPub Inside ... 0 NaN NaN NaN 0 6 2008 WD Normal 147500

1460 rows × 80 columns

In [5]:
# 1.1 Variables
# 1.1.1 Numeric variables
# The 29 column names are kept as one whitespace-separated block (6 + 6 + 6 + 5 + 5 + 1 per row)
# and split into a list; the order here is the order used for plotting and for later checks.
numerical = """
    LotFrontage LotArea MasVnrArea BsmtFinSF1 BsmtFinSF2 BsmtUnfSF
    TotalBsmtSF 1stFlrSF 2ndFlrSF LowQualFinSF GrLivArea BsmtFullBath
    BsmtHalfBath FullBath HalfBath BedroomAbvGr KitchenAbvGr TotRmsAbvGrd
    Fireplaces GarageYrBlt GarageCars GarageArea WoodDeckSF
    OpenPorchSF EnclosedPorch 3SsnPorch ScreenPorch PoolArea
    MiscVal
""".split()

# One histogram per numeric column on a 6x5 grid.
numeric_frame = df[numerical]
numeric_frame.hist(layout=(6, 5), figsize=(30, 20), bins=15)
Out[5]:
array([[<matplotlib.axes._subplots.AxesSubplot object at 0x00000222AAC7CB08>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222AACB2488>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222AB975088>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222AB9AE188>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222AB9E5248>],
       [<matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABA23E88>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABA58488>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABA8E588>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABA99488>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABAD2688>],
       [<matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABB38888>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABB6D988>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABBA6AC8>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABBDFBC8>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABC16C88>],
       [<matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABC4FDC8>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABC86EC8>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABCBFFC8>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABCFB148>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABD331C8>],
       [<matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABD6D2C8>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABDA6408>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABDDE508>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABE16608>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABE4D6C8>],
       [<matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABE85788>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABEBD888>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABEF59C8>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABF2DAC8>,
        <matplotlib.axes._subplots.AxesSubplot object at 0x00000222ABF66BC8>]],
      dtype=object)
In [6]:
# Column totals of the numeric features. A total of 0 would indicate a column that
# holds only zeros (assuming the values are non-negative - TODO confirm).
zero_column = df.loc[:, numerical].sum(axis=0)
zero_column
Out[6]:
LotFrontage         84130.0
LotArea          15354569.0
MasVnrArea         150551.0
BsmtFinSF1         647714.0
BsmtFinSF2          67962.0
BsmtUnfSF          828171.0
TotalBsmtSF       1543847.0
1stFlrSF          1697435.0
2ndFlrSF           506609.0
LowQualFinSF         8533.0
GrLivArea         2212577.0
BsmtFullBath          621.0
BsmtHalfBath           84.0
FullBath             2285.0
HalfBath              559.0
BedroomAbvGr         4185.0
KitchenAbvGr         1528.0
TotRmsAbvGrd         9516.0
Fireplaces            895.0
GarageYrBlt       2728360.0
GarageCars           2580.0
GarageArea         690551.0
WoodDeckSF         137597.0
OpenPorchSF         68124.0
EnclosedPorch       32053.0
3SsnPorch            4978.0
ScreenPorch         21989.0
PoolArea             4028.0
MiscVal             63494.0
dtype: float64
In [7]:
# 1.1.2 Categorical variables (including year/month columns).
# The columns are split into groups so that each group fits on one 4x2 grid of box plots.
categorical1 = ['MSSubClass','MSZoning','Street','Alley','LotShape','LandContour','Utilities']
categorical2 = ['LotConfig','LandSlope','Neighborhood','Condition1','Condition2','BldgType','HouseStyle']
categorical3 = ['OverallQual','OverallCond','YearBuilt','YearRemodAdd','RoofStyle','RoofMatl','Exterior1st']
categorical4 = ['Exterior2nd','MasVnrType','ExterQual','ExterCond','Foundation','BsmtQual','BsmtCond']
categorical5 = ['BsmtExposure','BsmtFinType1','BsmtFinType2','Heating','HeatingQC','CentralAir','Electrical']
categorical6 = ['KitchenQual','Functional','FireplaceQu','GarageType','GarageFinish','GarageQual','GarageCond']
categorical7 = ['PavedDrive','PoolQC','Fence','MiscFeature','MoSold','YrSold','SaleType','SaleCondition']


def plot_target_boxplots(frame, columns, target='SalePrice', nrows=4, ncols=2, figsize=(15, 10)):
    """Draw one box plot of `target` per entry of `columns` on a single figure.

    Parameters
    ----------
    frame : DataFrame containing `target` and every name in `columns`.
    columns : sequence of column names; one panel is drawn per name. Names beyond
        nrows * ncols are not plotted (zip stops at the last available panel).
    target : name of the y-axis column.
    nrows, ncols, figsize : grid layout and size passed to plt.subplots.

    Returns
    -------
    (fig, axes) as returned by plt.subplots, with axes always a 2-D array.
    """
    fig, axes = plt.subplots(nrows, ncols, figsize=figsize, squeeze=False)
    panels = axes.flatten()
    for var, subplot in zip(columns, panels):
        sns.boxplot(x=var, y=target, data=frame, ax=subplot)
    # Hide the grid cells that are left over when the group is smaller than the grid.
    for spare_panel in panels[len(columns):]:
        spare_panel.set_visible(False)
    return fig, axes


# One figure per group, replacing seven copies of the same plotting loop.
for column_group in (categorical1, categorical2, categorical3, categorical4,
                     categorical5, categorical6, categorical7):
    fig, ax = plot_target_boxplots(df, column_group)
In [9]:
# 1.2 Target variable: distribution of SalePrice
sale_price = df['SalePrice']
sale_price.hist(figsize=(8, 5), bins=15)
Out[9]:
<matplotlib.axes._subplots.AxesSubplot at 0x222b24c7708>

2. Data Preprocessing

2.1 Fill nans

In [10]:
# 2.1 Replace missing values.

# Missing-value report before imputation.
nan_counts_before = df.isna().sum()
print("total nan count: ", nan_counts_before.sum())
print("nans in columns: ", nan_counts_before)

# Numeric columns: fill each NaN with that column's mean.
# (Dropping columns that are mostly NaN was considered but is not done here.)
numeric_means = df[numerical].mean()
df_numerical = df[numerical].fillna(numeric_means)


def _fill_with_most_frequent(column):
    """Return `column` with NaNs replaced by its most frequent non-missing value."""
    most_frequent = column.value_counts().index[0]
    return column.fillna(most_frequent)


# Categorical columns: fill each NaN with the column's most frequent value.
# NOTE(review): for mostly-missing columns (e.g. PoolQC, Fence, MiscFeature) this gives
# nearly every row the same level - confirm that this is the intended treatment.
categorical = [
    name
    for group in (categorical1, categorical2, categorical3, categorical4,
                  categorical5, categorical6, categorical7)
    for name in group
]
df_categorical = df[categorical].apply(_fill_with_most_frequent)

# Target variable.
y = df['SalePrice']

# Reassemble: numeric columns first, then categorical, then the target.
df = pd.concat([df_numerical, df_categorical, y], axis=1)

# Missing-value report after imputation.
nan_counts_after = df.isna().sum()
print("total nan count: ", nan_counts_after.sum())
print("nans in columns: ", nan_counts_after)
total nan count:  6965
nans in columns:  MSSubClass         0
MSZoning           0
LotFrontage      259
LotArea            0
Street             0
                ... 
MoSold             0
YrSold             0
SaleType           0
SaleCondition      0
SalePrice          0
Length: 80, dtype: int64
total nan count:  0
nans in columns:  LotFrontage      0
LotArea          0
MasVnrArea       0
BsmtFinSF1       0
BsmtFinSF2       0
                ..
MoSold           0
YrSold           0
SaleType         0
SaleCondition    0
SalePrice        0
Length: 80, dtype: int64
In [11]:
# Preview the frame after imputation (numeric columns first, target last).
df
Out[11]:
LotFrontage LotArea MasVnrArea BsmtFinSF1 BsmtFinSF2 BsmtUnfSF TotalBsmtSF 1stFlrSF 2ndFlrSF LowQualFinSF ... GarageCond PavedDrive PoolQC Fence MiscFeature MoSold YrSold SaleType SaleCondition SalePrice
Id
1 65.0 8450 196.0 706 0 150 856 856 854 0 ... TA Y Gd MnPrv Shed 2 2008 WD Normal 208500
2 80.0 9600 0.0 978 0 284 1262 1262 0 0 ... TA Y Gd MnPrv Shed 5 2007 WD Normal 181500
3 68.0 11250 162.0 486 0 434 920 920 866 0 ... TA Y Gd MnPrv Shed 9 2008 WD Normal 223500
4 60.0 9550 0.0 216 0 540 756 961 756 0 ... TA Y Gd MnPrv Shed 2 2006 WD Abnorml 140000
5 84.0 14260 350.0 655 0 490 1145 1145 1053 0 ... TA Y Gd MnPrv Shed 12 2008 WD Normal 250000
... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ...
1456 62.0 7917 0.0 0 0 953 953 953 694 0 ... TA Y Gd MnPrv Shed 8 2007 WD Normal 175000
1457 85.0 13175 119.0 790 163 589 1542 2073 0 0 ... TA Y Gd MnPrv Shed 2 2010 WD Normal 210000
1458 66.0 9042 0.0 275 0 877 1152 1188 1152 0 ... TA Y Gd GdPrv Shed 5 2010 WD Normal 266500
1459 68.0 9717 0.0 49 1029 0 1078 1078 0 0 ... TA Y Gd MnPrv Shed 4 2010 WD Normal 142125
1460 75.0 9937 0.0 830 290 136 1256 1256 0 0 ... TA Y Gd MnPrv Shed 6 2008 WD Normal 147500

1460 rows × 80 columns

2.2 Drop numerical variables with multicollinearity

In [12]:
# 2.2 Multicollinearity check among the numeric variables.
# Rule of thumb used in this notebook: a VIF above 10 signals multicollinearity.
# The design matrix is extracted once instead of being rebuilt for every column.
# NOTE(review): no intercept column is added before computing the VIFs - confirm
# whether a constant term should be included in the design matrix.
numeric_matrix = df[numerical].values
vif_data = pd.DataFrame({
    "feature": numerical,
    "VIF": [
        variance_inflation_factor(numeric_matrix, column_position)
        for column_position in range(numeric_matrix.shape[1])
    ],
})
C:\Users\KIM\anaconda3\lib\site-packages\statsmodels\stats\outliers_influence.py:193: RuntimeWarning: divide by zero encountered in double_scalars
  vif = 1. / (1. - r_squared_i)
In [13]:
# Show the VIF computed for each numeric feature.
vif_data
Out[13]:
feature VIF
0 LotFrontage 15.617399
1 LotArea 2.587356
2 MasVnrArea 1.799190
3 BsmtFinSF1 inf
4 BsmtFinSF2 inf
5 BsmtUnfSF inf
6 TotalBsmtSF inf
7 1stFlrSF inf
8 2ndFlrSF inf
9 LowQualFinSF inf
10 GrLivArea inf
11 BsmtFullBath 3.564222
12 BsmtHalfBath 1.197847
13 FullBath 19.458272
14 HalfBath 2.997632
15 BedroomAbvGr 28.416082
16 KitchenAbvGr 29.411489
17 TotRmsAbvGrd 81.424035
18 Fireplaces 2.888910
19 GarageYrBlt 47.722183
20 GarageCars 34.621898
21 GarageArea 30.642974
22 WoodDeckSF 1.877392
23 OpenPorchSF 1.800334
24 EnclosedPorch 1.272064
25 3SsnPorch 1.033408
26 ScreenPorch 1.169930
27 PoolArea 1.096759
28 MiscVal 1.024630
In [14]:
# A VIF above 10 is taken to indicate multicollinearity with the other variables.
# The columns removed here are the ones with an infinite VIF plus TotRmsAbvGrd (VIF ~ 81).
# NOTE(review): other features whose VIF exceeds 10 (LotFrontage, FullBath, BedroomAbvGr,
# KitchenAbvGr, GarageYrBlt, GarageCars, GarageArea) are kept - confirm this is deliberate.
HIGH_VIF_COLUMNS = [
    'BsmtFinSF1', 'BsmtFinSF2', 'BsmtUnfSF', 'TotalBsmtSF', '1stFlrSF',
    '2ndFlrSF', 'LowQualFinSF', 'GrLivArea', 'TotRmsAbvGrd',
]
# Rebinding with errors="ignore" (instead of inplace=True) lets this cell be re-run
# without a KeyError once the columns are already gone.
df = df.drop(columns=HIGH_VIF_COLUMNS, errors="ignore")
In [15]:
# Preview the frame after the collinear numeric columns were dropped.
df
Out[15]:
LotFrontage LotArea MasVnrArea BsmtFullBath BsmtHalfBath FullBath HalfBath BedroomAbvGr KitchenAbvGr Fireplaces ... GarageCond PavedDrive PoolQC Fence MiscFeature MoSold YrSold SaleType SaleCondition SalePrice
Id
1 65.0 8450 196.0 1 0 2 1 3 1 0 ... TA Y Gd MnPrv Shed 2 2008 WD Normal 208500
2 80.0 9600 0.0 0 1 2 0 3 1 1 ... TA Y Gd MnPrv Shed 5 2007 WD Normal 181500
3 68.0 11250 162.0 1 0 2 1 3 1 1 ... TA Y Gd MnPrv Shed 9 2008 WD Normal 223500
4 60.0 9550 0.0 1 0 1 0 3 1 1 ... TA Y Gd MnPrv Shed 2 2006 WD Abnorml 140000
5 84.0 14260 350.0 1 0 2 1 4 1 1 ... TA Y Gd MnPrv Shed 12 2008 WD Normal 250000
... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ...
1456 62.0 7917 0.0 0 0 2 1 3 1 1 ... TA Y Gd MnPrv Shed 8 2007 WD Normal 175000
1457 85.0 13175 119.0 1 0 2 0 3 1 2 ... TA Y Gd MnPrv Shed 2 2010 WD Normal 210000
1458 66.0 9042 0.0 0 0 2 0 4 1 2 ... TA Y Gd GdPrv Shed 5 2010 WD Normal 266500
1459 68.0 9717 0.0 1 0 1 0 2 1 0 ... TA Y Gd MnPrv Shed 4 2010 WD Normal 142125
1460 75.0 9937 0.0 1 0 1 1 3 1 0 ... TA Y Gd MnPrv Shed 6 2008 WD Normal 147500

1460 rows × 71 columns

2.3 Handle multicollinearity among categorical variables with PCA, applied after one-hot encoding

In [16]:
# Target series (SalePrice), carrying the same index as df.
fin_y = df.loc[:, 'SalePrice']
In [17]:
# 2.3 One-hot encode the categorical variables.
# Every column except the target is a feature.
fin_x = df.drop(columns='SalePrice')
# NOTE(review): get_dummies with default arguments converts only object/category columns,
# so integer-coded categoricals (e.g. MSSubClass, OverallQual) presumably stay numeric - confirm.
fin_x_one_hot = pd.get_dummies(fin_x)
fin_x_one_hot.head()
Out[17]:
LotFrontage LotArea MasVnrArea BsmtFullBath BsmtHalfBath FullBath HalfBath BedroomAbvGr KitchenAbvGr Fireplaces ... SaleType_ConLw SaleType_New SaleType_Oth SaleType_WD SaleCondition_Abnorml SaleCondition_AdjLand SaleCondition_Alloca SaleCondition_Family SaleCondition_Normal SaleCondition_Partial
Id
1 65.0 8450 196.0 1 0 2 1 3 1 0 ... 0 0 0 1 0 0 0 0 1 0
2 80.0 9600 0.0 0 1 2 0 3 1 1 ... 0 0 0 1 0 0 0 0 1 0
3 68.0 11250 162.0 1 0 2 1 3 1 1 ... 0 0 0 1 0 0 0 0 1 0
4 60.0 9550 0.0 1 0 1 0 3 1 1 ... 0 0 0 1 1 0 0 0 0 0
5 84.0 14260 350.0 1 0 2 1 4 1 1 ... 0 0 0 1 0 0 0 0 1 0

5 rows × 279 columns

In [18]:
# Standardize every feature column (numeric and one-hot alike).
scaler = StandardScaler()
scaler.fit(fin_x_one_hot)
fin_x_stand = scaler.transform(fin_x_one_hot)
print(fin_x_stand.shape)
(1460, 279)
In [19]:
# PCA on the standardized matrix (numeric and one-hot columns together).
# From an earlier run: 131 components explain ~85% of the variance, 151 explain ~90%.
VARIANCE_TARGET = 0.85  # keep the fewest components whose cumulative ratio exceeds this
MIN_COMPONENTS = 3      # lower bound on the number of components

# Fit the full decomposition once and read the answer off the cumulative explained
# variance, instead of refitting a PCA for every candidate component count.
# The exact ("full") solver is requested so the leading ratios do not depend on the
# component count; NOTE(review): the selected count may therefore differ marginally
# from a run in which scikit-learn picked an approximate solver.
pca = PCA(svd_solver="full", random_state=42)
pca.fit(fin_x_stand)
cumulative_ratio = np.cumsum(pca.explained_variance_ratio_)

# side="right" yields the first position whose cumulative ratio is strictly above the
# target; +1 turns that zero-based position into a component count.
final_comp = int(np.searchsorted(cumulative_ratio, VARIANCE_TARGET, side="right")) + 1
final_comp = min(max(final_comp, MIN_COMPONENTS), cumulative_ratio.shape[0])

Final_PCA = PCA(n_components=final_comp, svd_solver="full", random_state=42)
Final_PCA.fit(fin_x_stand)
cluster_df = Final_PCA.transform(fin_x_stand)  # final array after PCA
comp_check = Final_PCA.explained_variance_ratio_
num_comps = comp_check.shape[0]
# {:.2%} renders the fraction as a percentage (e.g. 0.8505 -> 85.05%).
print("Using {} components, we can explain {:.2%} of the variability in the original data.".format(final_comp, comp_check.sum()))
Using 131 components, we can explain 0.8504905129815726% of the variability in the original data.
In [20]:
# Shape of the PCA-transformed array: (rows, retained components).
cluster_df.shape
Out[20]:
(1460, 131)
In [21]:
# Wrap the PCA scores in a DataFrame that keeps the Id index of the encoded frame.
# With a default 0..n-1 index, the index-aligned concat with SalePrice (indexed by Id,
# starting at 1) would pair every feature row with a different house's price and
# introduce NaN rows at both ends.
fin_x = pd.DataFrame(cluster_df, index=fin_x_one_hot.index)

2.4 Remove outliers

In [22]:
#The dataset is small, so no outliers are removed for now; this may be revisited later to improve performance.

2.5 Divide data into train/validation/test sets

In [23]:
# Join the features and the target side by side; SalePrice becomes the last column.
# pd.concat aligns rows on index labels, so fin_x and fin_y must share the same index.
frames_to_join = [fin_x, fin_y]
fin_df = pd.concat(frames_to_join, axis="columns")
In [24]:
# Shuffle once with a fixed seed so the split is reproducible, then cut the rows
# 40% / 30% / 30% into train / validation / test.
SPLIT_SEED = 42
shuffled_df = fin_df.sample(frac=1, random_state=SPLIT_SEED)
train_end = int(.4 * len(fin_df))
valid_end = int(.7 * len(fin_df))
train_df = shuffled_df.iloc[:train_end]
validate_df = shuffled_df.iloc[train_end:valid_end]
test_df = shuffled_df.iloc[valid_end:]
In [25]:
# Preview the training split (PCA component columns followed by SalePrice).
train_df
Out[25]:
0 1 2 3 4 5 6 7 8 9 ... 122 123 124 125 126 127 128 129 130 SalePrice
1320 1.848604 -4.066261 -0.027167 1.654556 -1.596239 -0.219456 0.316095 0.023938 0.189747 -0.282273 ... 0.058099 -0.259488 0.667925 0.008952 -0.038146 0.507983 0.352036 -1.507556 0.190584 111000.0
309 -6.464090 0.121125 3.424288 1.383345 -1.453800 0.434944 -0.566364 -0.739324 0.578719 2.022136 ... 0.938911 -0.171392 -0.251452 0.940274 0.785401 0.583321 0.226217 -0.250147 0.639014 82500.0
751 -3.479064 2.253071 -1.256313 -3.318174 -0.780026 -0.837351 1.232485 1.145197 -0.803659 -0.728762 ... -0.330501 -0.465258 0.649816 -1.201147 0.686879 -1.498306 0.273065 0.057768 -0.877124 96500.0
1422 -3.894058 2.471481 -3.184897 0.892515 2.610650 -2.002142 0.255965 -0.704022 2.423512 2.099561 ... 0.322870 -0.372124 0.118197 -0.571605 -0.443687 -0.144770 0.243440 -0.384350 -0.578949 127500.0
867 1.754506 -1.718710 -0.730321 0.262206 -1.531188 -1.149268 2.314404 1.414364 0.096641 0.291313 ... 0.104375 0.634254 0.780303 0.047784 -0.430769 0.070652 0.974944 0.383676 -1.383187 248900.0
... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ...
704 -4.661512 0.639714 -1.406257 -0.497498 -0.545557 -2.912151 1.445229 0.107580 1.172127 1.046550 ... 0.649289 -0.218130 -0.060713 -0.220868 -1.087713 -1.339558 -0.390723 -0.888748 0.087296 140000.0
510 2.443506 -4.563067 1.402458 1.130627 -0.456752 0.327434 -0.782610 1.628426 0.953320 0.176060 ... 0.831986 1.395367 -2.657604 0.638451 -0.269614 0.585963 2.474561 -0.104986 0.806993 124500.0
1257 3.598513 0.712288 -0.446503 -0.295386 -1.884812 -1.823127 -0.275341 1.100484 0.951111 0.577582 ... -0.685779 1.382168 0.092182 0.232143 -1.553589 -1.035287 -0.837404 0.267741 0.080008 301500.0
532 2.577726 -0.142444 -1.076895 0.336057 -0.731826 -1.941778 1.910293 0.500701 0.494599 -1.358917 ... -1.991046 1.244107 0.665385 0.909369 0.052820 -1.176005 1.387738 1.238806 0.606789 128000.0
676 9.349732 8.465874 6.817668 -2.804081 0.542873 3.668212 4.363106 -6.659886 1.302933 -0.902192 ... -1.100479 1.247859 2.073852 -1.772762 1.438705 1.319859 0.669150 2.588434 -1.186357 148500.0

584 rows × 132 columns

In [26]:
def _complete_rows_xy(frame, target="SalePrice"):
    """Drop rows containing any NaN, then separate the feature columns from the target.

    Returns the cleaned frame, its feature columns and its target column.
    """
    complete = frame.dropna(axis=0)
    return complete, complete.drop(target, axis=1), complete[target]


# The same cleaning and X/y separation is applied to each of the three splits.
# NOTE(review): dropna silently discards every row with a missing value.
train_df, train_x, train_y = _complete_rows_xy(train_df)
validate_df, valid_x, valid_y = _complete_rows_xy(validate_df)
test_df, test_x, test_y = _complete_rows_xy(test_df)

3.1 model1 - random forest

In [38]:
from sklearn.ensemble import RandomForestRegressor
from sklearn.metrics import accuracy_score  # accuracy function

# Shallow random forest: 20 trees of depth <= 5, fixed seed for repeatability.
rf_settings = dict(n_estimators=20, max_depth=5, random_state=0)
clf = RandomForestRegressor(**rf_settings).fit(train_x, train_y)

# Predictions for the test split.
predict1 = clf.predict(test_x)
In [28]:
# Inspect the random-forest predictions for the test split (predict1.shape was (439,)).
predict1
Out[28]:
array([170804.15801211, 199305.89852374, 187396.5044018 , 188111.05005443,
       304083.82153772, 166958.33019854, 170482.30885596, 173770.7329315 ,
       153582.7403209 , 228331.33183422, 184249.35380908, 192599.60909106,
       194387.09815769, 164077.01442039, 196425.95753373, 183215.54906983,
       190623.53404909, 168145.2129837 , 164671.43442381, 173001.71390418,
       191359.83521411, 163257.76125947, 319683.80273779, 164875.63403212,
       165236.11471602, 190472.72971538, 190108.08689043, 179788.54681382,
       173064.02231888, 181657.18240534, 170873.5461995 , 172493.15247218,
       218871.41653098, 170846.11678739, 186155.93657377, 181977.47621627,
       181294.39722656, 163264.79041743, 174577.80485473, 180615.9108095 ,
       168186.80761463, 254638.4043283 , 167861.71311936, 196693.3853321 ,
       164102.81785863, 226603.10111305, 181795.28709431, 162481.71098472,
       176740.72222044, 166348.21242801, 194268.65737652, 167875.89419411,
       222501.49909251, 220250.01997822, 189999.12065136, 199951.10583046,
       191732.4656445 , 194851.8515738 , 174477.62856509, 163021.91875119,
       167962.85834697, 173890.30606226, 167014.98879969, 183035.87122158,
       252246.56903918, 166653.76251893, 226763.49642357, 186747.9185184 ,
       198916.08035982, 384420.4515282 , 200146.15895476, 175039.43417718,
       195133.84232917, 188446.20703511, 167335.46702027, 169601.68071932,
       169437.36353673, 176813.05137815, 171906.86905061, 169278.62043299,
       195140.33574884, 160827.60935901, 179824.22332388, 195115.3543186 ,
       201164.01863389, 168365.37293826, 200054.40915732, 181995.51036673,
       178407.11038631, 172026.72154865, 170898.01634362, 173273.78678905,
       213191.53987672, 176260.67781345, 172454.54289675, 192171.28662092,
       167881.22336949, 184489.88766112, 195139.45153702, 339430.18821904,
       205411.76816457, 201178.39466805, 179014.94397595, 166862.78386969,
       182227.0494748 , 255370.17654095, 175142.080869  , 190347.04303251,
       181078.7807537 , 161333.19839201, 175096.94526154, 185404.34855352,
       204158.81520942, 180017.11706599, 186064.70797096, 191849.01337352,
       239212.0819567 , 174167.72995854, 185878.26081111, 197716.57687696,
       179623.2991039 , 167137.00493357, 185875.60095942, 190081.1844764 ,
       177882.7553615 , 170455.81770472, 169857.95486675, 174112.37329201,
       192305.89039775, 165608.06328772, 162753.14095721, 170919.7438847 ,
       325128.40199571, 173454.77772586, 175014.43619662, 156850.95980581,
       165844.87483625, 168525.63797682, 183261.63396273, 172879.00824531,
       180808.63860497, 212513.14104922, 198630.26566338, 198135.59321543,
       165017.95080918, 176814.40063606, 173381.55032265, 174874.42641   ,
       192010.06521203, 159944.09705962, 182999.99472185, 162362.12879271,
       178161.19402537, 169442.4687155 , 194328.777087  , 166068.98955922,
       184824.85077765, 246684.20358169, 168828.98881206, 166069.10802369,
       173100.3203168 , 177910.51376838, 177490.69836571, 377511.46204228,
       166687.07646402, 174105.63164517, 174871.31621484, 176424.40313991,
       165661.28153083, 156063.66172985, 163370.38674013, 167763.47315921,
       210158.76443868, 180423.66459494, 173930.67842892, 169100.59425471,
       177799.41456678, 186390.57785566, 172692.92121524, 263003.42240075,
       180744.06308933, 176950.67934117, 190441.38755677, 176811.84151608,
       186417.49211176, 189982.88892762, 219417.76595006, 185399.45623132,
       163681.54589076, 178367.46054675, 173640.36332863, 183773.58303134,
       208726.9323152 , 178033.94211545, 173640.44550149, 183065.94976253,
       180867.66569955, 166869.94631144, 170162.80861652, 171851.10378418,
       170404.01607785, 157603.80384927, 201945.95567211, 200332.03200545,
       183884.8347831 , 166949.51228959, 192064.24226961, 180216.99528309,
       160789.80090376, 176983.27328179, 181389.05613666, 191843.64808348,
       216541.85292508, 181753.58014209, 176798.52404764, 201856.58004328,
       178167.17473079, 193439.93617814, 162686.05739324, 185112.72893549,
       185920.24940013, 183522.27363016, 185972.84982558, 205748.04058002,
       170442.40999907, 158982.12563842, 170381.93192837, 178069.67566639,
       225801.15737059, 174310.4753669 , 181169.20958472, 181533.41070586,
       213004.32610269, 165010.61710855, 169877.17430719, 165263.38510662,
       172949.10317798, 166627.63977986, 255976.1558128 , 195139.4514161 ,
       162635.71064739, 194529.22086552, 220963.9780075 , 187786.22150152,
       181372.40653233, 203798.46997093, 186325.48379932, 178760.83214566,
       173368.13318118, 206898.01461399, 178265.08710505, 182055.92349157,
       162442.83750575, 258314.02913873, 166256.74245318, 163524.70859323,
       174264.56824742, 169966.13516028, 184056.5050026 , 175677.11213991,
       186657.18391305, 171365.27755388, 280108.8925933 , 195103.56177404,
       184456.91736974, 195922.21465838, 171468.54048636, 216342.62662035,
       170437.84645866, 161867.77079652, 172931.18193329, 179518.99750296,
       170633.94263419, 231758.74957237, 165688.44346636, 196814.43598111,
       182138.71620403, 153274.69216353, 193174.96272209, 170105.27725175,
       166301.77817241, 168042.30117383, 313422.44752267, 173297.28936188,
       191709.23404109, 185429.26051895, 169048.26494759, 170182.40873714,
       186914.6433398 , 174398.94622224, 172901.54609802, 181708.41031374,
       239302.57036716, 182539.96149967, 207248.55201889, 203902.22162433,
       221258.4423809 , 266538.95762686, 175055.87375088, 183132.79166497,
       187103.47848795, 161085.83173088, 168803.2063704 , 174856.69519139,
       165642.24307103, 207138.20059692, 174319.03603115, 190499.19991999,
       207802.51256879, 190839.13429364, 178381.48787776, 185109.40727583,
       186918.41769757, 163276.2738914 , 184873.3662854 , 204594.36977033,
       185390.25316444, 167711.02219425, 178204.89873261, 199971.12805181,
       182830.10105994, 168482.15731611, 220839.08648636, 168485.05502618,
       172521.1058638 , 178330.97648738, 187607.85578113, 221649.80952747,
       186050.23007869, 180932.15881172, 183683.58786307, 318300.15326755,
       173949.16022791, 180189.07094983, 171072.05463687, 186377.11301301,
       181131.22424434, 192716.81580115, 188668.24789379, 181807.90424589,
       181979.06896399, 167950.81608211, 207295.12135992, 174707.1888586 ,
       162087.1069718 , 170353.04468486, 228586.10778558, 170387.80918474,
       217889.80349443, 196635.84067151, 186655.12150092, 211375.90937572,
       168589.6212344 , 180517.14153056, 178421.63166715, 169059.078348  ,
       177638.81242767, 200684.03404486, 177598.80581528, 165459.0787819 ,
       215787.94589257, 165726.00809738, 203752.42228058, 198894.08768408,
       250755.27150979, 180856.00054368, 194403.21440277, 173031.46919072,
       175615.18321219, 179504.76935724, 175454.84904986, 189866.31741414,
       354989.24870581, 192755.1822482 , 182661.73360415, 164750.03172125,
       194601.2635369 , 182143.46412985, 168704.78307375, 184916.66510001,
       173425.37332523, 193566.47686033, 177109.30986299, 263122.30265251,
       160518.95494465, 197544.40147966, 175098.03516933, 197011.17119831,
       186291.6569078 , 320116.82096716, 212065.99244981, 205582.63022041,
       163711.67531729, 164403.72850959, 179851.67005966, 173237.34934037,
       167120.54628801, 164852.10241945, 170889.54294184, 171493.60702028,
       168113.92514853, 181742.35196146, 183824.14814652, 181182.86719663,
       191927.32076433, 193462.9799785 , 187683.52326996, 205373.00319569,
       170261.11188124, 181013.17826521, 171446.82434309, 210021.90182207,
       173302.06131404, 169662.13297886, 169992.51720156, 177525.66328075,
       170373.24617923, 285135.51876301, 204443.43695345, 177764.87683796,
       212855.10462066, 166537.93911547, 199285.72593411, 196877.32319577,
       319520.94261658, 168363.74755756, 187596.54140719, 358213.79358847,
       189001.29547692, 165758.81327114, 168659.78170494, 161240.88387216,
       185795.63792101, 194549.39164684, 190557.58673723, 305173.38698387,
       232882.8815902 , 180801.18300371, 180836.39191137])
In [29]:
# True sale prices of the test split, for comparison with the predictions.
test_y
Out[29]:
723     124500.0
1445    179600.0
1447    157900.0
54      385000.0
1186    104900.0
          ...   
69       80000.0
1182    392500.0
1412    140000.0
312     132000.0
1450     92000.0
Name: SalePrice, Length: 439, dtype: float64
In [30]:
# Feature columns (PCA components) of the test split.
test_x
Out[30]:
0 1 2 3 4 5 6 7 8 9 ... 121 122 123 124 125 126 127 128 129 130
723 2.964688 1.108189 -1.526426 0.106318 -1.042796 -0.612592 -1.032391 1.350073 -1.213383 -0.725471 ... 0.254233 0.004565 0.166516 -0.192522 0.230416 -0.312816 -0.793391 0.295259 -0.816092 -0.227311
1445 2.735676 -1.591089 -1.468329 1.071727 0.432595 -1.166412 -0.803060 0.772676 1.314567 0.632887 ... 0.884464 -1.727236 -0.055649 0.800140 -0.018565 -0.294392 1.178796 -1.332034 -0.768121 -0.123243
1447 -5.013797 0.493032 -1.197866 -2.794624 -0.234594 -0.239627 1.083601 -0.860849 -0.511962 0.387550 ... -0.583836 -0.769786 0.890560 -0.117715 0.012387 -0.821743 0.472884 0.034400 -0.179110 0.043905
54 4.136926 -2.873939 0.595933 0.507417 2.241932 -0.854528 -2.331029 0.376094 -3.234142 -0.455991 ... 0.162953 -0.789771 0.236854 -0.045141 1.328041 1.117209 -0.023157 -0.171450 0.845562 0.614847
1186 6.723059 1.712578 5.890442 -1.582244 4.679489 4.702633 -1.451959 -0.309356 -0.251688 5.220498 ... 0.222234 -1.853359 0.033253 -0.361165 -1.636066 -0.768555 2.416819 0.819171 -0.792724 1.797923
... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ... ...
69 2.172387 -0.808487 2.477093 -1.556855 -0.000057 0.542408 1.863973 -2.316841 -0.667263 -1.703224 ... -1.252408 0.645252 0.178384 -2.211365 -0.783801 0.160720 1.588978 -0.956403 0.773979 0.956843
1182 -6.409263 -2.428261 7.275868 -3.654681 -3.311630 11.733556 0.314062 1.212766 4.795634 -7.882574 ... 0.166486 0.592590 -0.657239 0.346196 0.694975 -0.667955 0.060696 1.738588 -1.676723 0.975703
1412 6.733677 3.457037 1.266721 2.745734 2.062651 0.352802 11.022980 -3.396504 -3.744251 -3.583932 ... 0.597551 -1.127908 -1.421101 -0.401232 1.240268 -1.021330 0.972074 0.034435 -0.147382 -0.074097
312 4.952066 1.422160 -1.451887 0.550482 2.051023 2.498262 -3.053314 1.050818 -0.896263 1.200291 ... 1.465287 -0.389000 -1.401231 0.186633 -0.178377 0.620381 -1.325567 0.570278 0.470974 0.453561
1450 1.621479 0.129355 -3.111755 -0.526160 1.554192 0.909834 3.317888 -0.116084 -2.044209 -0.761061 ... 0.172002 0.967188 0.243369 0.678146 0.880746 -0.424442 1.744801 -0.563968 0.833185 0.814238

439 rows × 131 columns

In [31]:
# RMSE of the random forest on the test split (square root of the MSE).
rf_mse = mean_squared_error(y_true=test_y, y_pred=predict1)
print(rf_mse ** 0.5)
81553.2328192636

3.2 model2 - GBM

In [29]:
from sklearn.ensemble import GradientBoostingRegressor

# Fit a gradient-boosting regressor on the training split; random_state is
# pinned so repeated runs give the same model.
gb_clf = GradientBoostingRegressor(random_state=0)
gb_clf.fit(train_x, train_y)

# Original note left in this cell (translated; it was bare text, which is not
# valid Python and made the cell a SyntaxError): "At this point, predict _"
gb_pred = gb_clf.predict(test_x)

# Report the error against test_y as RMSE (square root of the MSE).
print(mean_squared_error(test_y, gb_pred) ** 0.5)
86231.12024571189
In [30]:
# Show the GBM predictions (gb_pred) as the cell output.
gb_pred
Out[30]:
array([180090.65878652, 180194.62118792, 178373.95764372, 174822.92370776,
       138934.49610489, 156865.55954029, 164799.28854393, 216436.88077777,
       161360.16703368, 188634.53687392, 145561.51441596, 193454.10876369,
       162049.4291099 , 160753.10472021, 185361.06183909, 191406.52071744,
       188461.05617389, 197192.09394978, 149926.54875668, 158640.26829547,
       134398.96691226, 153139.37832544, 154482.60219034, 152701.34162143,
       181026.85056599, 181849.69480777, 194203.14568695, 156994.75917599,
       214544.44594557, 331492.16154611, 189529.18202521, 165373.42754726,
       165559.63547916, 186053.04872021, 214893.7881934 , 209859.16368319,
       167310.88657884, 207763.27877076, 201263.59606257, 142392.74571533,
       211908.4787579 , 183238.28355833, 214708.87689714, 179359.30084616,
       169189.48363774, 153269.76395589, 151519.13997429, 179178.99701203,
       171922.60865982, 188594.26989367, 180074.96931598, 208650.17634869,
       204081.2762824 , 163818.30866441, 277864.93490689, 198543.43598868,
       225925.38037279, 223729.74368159, 184114.84665957, 222400.30356906,
       196427.82056872, 204648.55431559, 174471.96258975, 155496.47777149,
       168145.62504826, 193096.0920594 , 161044.45842093, 202844.23649115,
       199345.645978  , 156136.74734213, 171124.55213199, 221440.12834889,
       198696.33036989, 200260.17478093, 164566.27284388, 183834.68149496,
       186156.71276478, 170002.83860072, 190018.10166141, 189141.79959738,
       165499.70953747, 348607.86994486, 224850.12806853, 149573.03342503,
       160521.03221253, 157826.75432039, 204960.67243326, 150870.25460843,
       246017.4291673 , 207966.59211126, 190269.65310346, 178247.76473937,
       207329.04578477, 180344.15533868, 203551.28687516, 205895.67827976,
       201976.14005032, 169552.20847316, 157865.68320434, 188741.92838732,
       180763.84184319, 184411.32554114, 203777.47282951, 170871.91285812,
       203771.75756006, 195329.04775483, 165543.83634719, 165838.31061542,
       199552.90639895, 151453.8628795 , 201006.20276964, 150336.10388628,
       237010.21475533, 167398.00531837, 172764.89699673, 160195.70988638,
       130137.5047433 , 173998.01446339, 174222.69737618, 199480.55385826,
       191696.81953069, 135580.02616792, 162972.51171592, 185264.01332346,
       243254.65345032, 189635.23623713, 153174.89136909, 189134.30996495,
       240313.22919278, 175102.58239862, 157019.39502983, 168347.33951357,
       210314.51168214, 176338.43545837, 202677.7362189 , 166293.75779692,
       178852.54409587, 218384.017527  , 179615.90514181, 399453.77904726,
       195569.17193582, 209398.5683525 , 166454.33042797, 167348.82828713,
       171803.42399124, 235705.28685413, 243550.37322434, 175732.3781936 ,
       171843.82887081, 213641.26432618, 142969.50936745, 161229.66933407,
       148426.27266202, 174729.06705973, 191781.46036723, 156149.41380651,
       208122.12433912, 169535.44982483, 164481.08437487, 202575.00130472,
       206652.82765958, 205695.06247495, 217357.1287975 , 228695.93940945,
       197560.24739161, 198096.12733597, 146473.47377688, 175324.20833002,
       192222.96437434, 180069.79117816, 167531.8745685 , 198738.18337164,
       137327.97562239, 195908.09155421, 207710.2708911 , 164302.33334426,
       196095.87882227, 194616.07771942, 155825.50729963, 175020.46344822,
       174392.85847973, 174879.14863964, 176413.26549539, 189002.70700499,
       138445.06673538, 188622.54315204, 301332.93119747, 164073.88653556,
       202991.25611312, 149262.15575457, 155818.75535889, 208858.95111115,
       175923.59389918, 150158.98485147, 213754.02345278, 162412.69951067,
       287970.318786  , 263494.27918797, 167261.7862372 , 132885.18181943,
       187331.95700442, 217867.91813841, 145927.38177187, 181374.17906613,
       154044.9663035 , 185804.06236336, 160346.85115057, 151772.16048316,
       185123.92215738, 175976.99942653, 162223.1847279 , 183724.12624682,
       150239.8483688 , 200528.21537356, 268389.25244948, 172578.81503849,
       195193.10535513, 178955.35972482, 148413.84668668, 168062.3062221 ,
       182045.94235937, 187490.75214669, 178297.41791104, 162477.19744704,
       190174.0093809 , 198004.60118966, 193659.38270042, 189506.83887808,
       175951.8163147 , 365863.55137208, 186926.42299268, 171577.20323059,
       241535.21494513, 235510.26683741, 219332.59655335, 370439.38692558,
       193338.93428857, 173761.25818885, 189317.82921669, 190167.0741003 ,
       162370.44893871, 210697.58344289, 184771.74455743, 175893.1443015 ,
       186973.82218772, 177621.63081877, 180452.20470334, 208947.20955138,
       155464.16346715, 167734.15964443, 238619.16070939, 139945.79149113,
       148723.11598262, 198177.95241293, 258003.20709271, 187109.76591551,
       183737.69718636, 223180.09703792, 186049.42161655, 189431.26290738,
       148830.05229918, 166903.975006  , 179986.81441872, 160756.17762163,
       160633.59134204, 380054.40988535, 177101.39800785, 164944.05372734,
       174176.84532396, 180970.84459324, 124343.75003986, 187602.48070445,
       171277.3556903 , 190714.27148366, 177442.92728434, 175935.9044163 ,
       169566.18744725, 157040.00342309, 227960.14639574, 169820.57716441,
       475153.49908209, 175325.97452401, 164177.45910618, 183035.00176936,
       197773.29508681, 165158.62920466, 157243.08555486, 230150.92699678,
       214010.2040523 , 162207.35437734, 207025.41334213, 188639.61474974,
       159048.77940768, 211981.35143597, 168497.21385684, 186548.43449385,
       273575.37670184, 171295.64457453, 584255.25344569, 196612.52109597,
       199538.84322144, 169211.26380152, 227415.9878593 , 197418.44872096,
       182079.49605089, 157419.96949123, 188433.26820045, 159317.99196033,
       161822.83844396, 218111.73885991, 161558.41853262, 194351.33250217,
       166551.7276967 , 167198.47685993, 182087.3707697 , 199550.94486226,
       211277.98497117, 194855.84773148, 194015.18661373, 154642.42651508,
       180719.00542163, 171823.20121591, 181911.89103388, 197569.05752168,
       207379.19381217, 191009.78300244, 157432.04031991, 181233.20735627,
       190960.24047956, 257711.39561435, 158170.56234387, 232631.29958632,
       168870.55415334, 236343.68998325, 174388.02131455, 230894.2167905 ,
       179530.1613262 , 147145.63070697, 188453.71367726, 204517.56004665,
       135108.33424556, 188802.87610497, 163824.37096541, 188597.72630333,
       201815.56626537, 187945.49950822, 171727.69005749, 178696.11973444,
       212464.65122835, 187441.54423546, 168012.20720875, 204920.325722  ,
       171689.31309375, 161805.1785489 , 186273.86616676, 178607.25364404,
       202810.90239123, 204797.56733911, 192054.57390997, 216407.17084078,
       180937.02826789, 183150.91425419, 204457.79017607, 232671.88672745,
       191555.95552037, 211153.51559799, 151839.52446895, 176094.04151007,
       152376.57757492, 180152.36663611, 152629.3698433 , 166681.17548773,
       160935.13850895, 206864.81812145, 164977.63086432, 197039.95411956,
       152080.13974498, 191881.53799129, 227703.14118701, 153786.68170544,
       141435.25022524, 193162.42710413, 204360.00391154, 405194.35962149,
       171367.34094716, 173900.3783018 , 163574.6708386 , 140210.6381644 ,
       190877.76591788, 227644.76219253, 172171.26938983, 230515.47964311,
       177235.96550943, 169326.52373092, 155525.47677134, 178905.46333537,
       244606.64441916, 159013.02002545, 154806.87558884, 171281.45492232,
       151861.65127243, 212994.39938345, 195996.67178628, 182499.77481231,
       172645.45686385, 161666.21404551, 234020.50898558, 208507.63359797,
       171456.98261248, 219802.04522375, 164929.13905667, 142459.50275551,
       197275.75865999, 167218.35883903, 255311.96768829, 184315.72472937,
       191551.34538892, 209426.81604064, 182099.88627589, 200235.83375452,
       169961.8218497 , 184797.22904891, 168959.70861935, 207304.01309823,
       184470.42811695, 168907.05887625, 171798.6773019 , 191471.34404045,
       198784.8460898 , 259636.11356264, 167363.12527522, 183820.62962127,
       189339.90689467, 143069.35025514, 189936.66731099, 202527.16600682,
       200288.61220431])
In [31]:
# Show test_y, the target values the predictions above are scored against.
test_y
Out[31]:
703     361919.0
668     193500.0
770     538000.0
528     446261.0
241     262500.0
          ...   
587     130000.0
73      185000.0
775     395000.0
1336    167900.0
1164    108959.0
Name: SalePrice, Length: 437, dtype: float64

3.3 model2 - xgboost

In [33]:
#!pip install xgboost
import xgboost
Collecting xgboost
  Downloading xgboost-1.6.2-py3-none-win_amd64.whl (125.4 MB)
Requirement already satisfied: numpy in c:\users\kim\anaconda3\lib\site-packages (from xgboost) (1.18.1)
Requirement already satisfied: scipy in c:\users\kim\anaconda3\lib\site-packages (from xgboost) (1.4.1)
Installing collected packages: xgboost
Successfully installed xgboost-1.6.2
In [232]:
# XGBoost regressor. subsample=0.75 makes each boosting round draw a random
# subset of the training rows, so the seed is pinned (random_state=0, the same
# value the GBM cell uses) to keep the fit and the reported RMSE repeatable.
xgb_model = xgboost.XGBRegressor(
    n_estimators=100,
    learning_rate=0.08,
    gamma=0,
    subsample=0.75,
    colsample_bytree=1,
    max_depth=7,
    random_state=0,
)
xgb_model.fit(train_x, train_y)
xgb_pred = xgb_model.predict(test_x)
In [242]:
# XGBoost error against test_y: square root of the MSE, i.e. RMSE.
xgb_mse = mean_squared_error(test_y, xgb_pred)
print(xgb_mse ** 0.5)
86369.76066563524

3.3 model3 - light gbm

LightGBM is a fast and accurate model, but it can overfit when the dataset is small.
In [34]:
from lightgbm import LGBMRegressor

# SalePrice is a continuous target, so the model must be trained with a
# regression objective. objective='binary' is a log-loss for 0/1 labels and
# yields predictions on the wrong scale (hence an RMSE far worse than the
# other models).
lgb_clf = LGBMRegressor(num_leaves=31, objective='regression')
lgb_clf.fit(train_x, train_y)
lgbm_pred = lgb_clf.predict(test_x)
In [35]:
# LightGBM error against test_y: square root of the MSE, i.e. RMSE.
lgbm_mse = mean_squared_error(test_y, lgbm_pred)
print(lgbm_mse ** 0.5)
195432.12411843642

3.4 model 4 - ANN(3-layers)

In [25]:
import torch
import torch.nn as nn
import torch.nn.functional as F

class MultOutRegressor(nn.Module):
    """Feed-forward regressor: two ReLU hidden layers plus a linear output layer.

    Args:
        input_dim: Number of input features per sample.
        target_dim: Number of values predicted per sample.
        hidden_dim: Width of both hidden layers.
        seed: Passed to ``torch.manual_seed`` before the layers are created.
            Note that this reseeds PyTorch's global RNG as a side effect.
    """

    def __init__(self, input_dim, target_dim, hidden_dim=32, seed=1234):
        super().__init__()
        torch.manual_seed(seed)
        self.hidden_dim, self.target_dim = hidden_dim, target_dim

        # Layers are built in fc1, fc2, fc3 order right after seeding, which
        # determines their initial weights.
        self.fc1 = nn.Linear(input_dim, hidden_dim)
        self.fc2 = nn.Linear(hidden_dim, hidden_dim)
        self.fc3 = nn.Linear(hidden_dim, target_dim)

    def forward(self, x):
        """Map a batch of features to predictions (no activation on the output)."""
        hidden = F.relu(self.fc1(x))
        hidden = F.relu(self.fc2(hidden))
        return self.fc3(hidden)
In [26]:
from torch.utils.data import Dataset
from torch.utils.data import DataLoader
class TabularDataSet(Dataset):
    """Map-style dataset pairing a feature matrix with its targets.

    Features are converted to float32 once at construction time; targets are
    stored exactly as given.
    """

    def __init__(self, X, Y):
        self._Y = Y
        self._X = np.float32(X)

    def __len__(self):
        """Number of samples, taken from the length of the targets."""
        n_samples = len(self._Y)
        return n_samples

    def __getitem__(self, idx):
        """Return the ``(features, target)`` pair stored at position ``idx``."""
        features = self._X[idx]
        label = self._Y[idx]
        return features, label
In [27]:
from torch import optim
from IPython import display

# Convert the training frame / target to NumPy arrays for the Dataset wrapper.
numpy_x = train_x.to_numpy()
numpy_y = train_y.to_numpy()

tabulardataset = TabularDataSet(numpy_x, numpy_y)
# DataLoader defaults apply here: batch_size=1, no shuffling.
train_dl = DataLoader(tabulardataset)

# Size the input layer from the data instead of hard-coding the column count
# (131 for the current feature matrix), so the cell survives feature changes.
model = MultOutRegressor(numpy_x.shape[1], 1)

# lr=0.001 is written out explicitly; it is also AdamW's library default.
optimizer = optim.AdamW(model.parameters(), lr=0.001)
criterion = nn.MSELoss()
In [33]:
def update(input, target, model, criterion, optimizer, max_norm=5, verbose=False):
    """Run one optimisation step on a single batch and return its loss.

    Args:
        input: Batch of features passed to ``model``.
        target: Batch of targets. Cast to float and reshaped to the shape of
            the model output before the loss is computed.
        model: Module being trained.
        criterion: Loss callable invoked as ``criterion(output, target)``.
        optimizer: Optimizer that steps ``model``'s parameters.
        max_norm: Threshold passed to gradient-norm clipping.
        verbose: If True, print the raw output and loss of this batch. Off by
            default because it emits two lines per batch.

    Returns:
        The batch loss (computed before the parameter step) as a detached
        tensor.

    Raises:
        RuntimeError: If ``target`` cannot be reshaped to the output's shape.
    """
    optimizer.zero_grad()
    output = model(input)

    # Targets arrive as (batch,) while the model emits (batch, target_dim).
    # Letting the loss broadcast those shapes triggers a UserWarning and, for
    # batch sizes above 1, silently compares every output with every target.
    target = target.float().reshape(output.shape)
    loss = criterion(output, target)

    if verbose:
        print('output : ', output)
        print('loss: ', loss)

    loss.backward()
    torch.nn.utils.clip_grad_norm_(model.parameters(), max_norm)
    optimizer.step()

    # Detach so callers that accumulate losses do not keep the graph alive.
    return loss.detach()

def one_epoch(dataloader, model, criterion, optimizer):
    """Train for one pass over ``dataloader`` and return the mean batch loss.

    Args:
        dataloader: Iterable yielding ``(input, target)`` batches.
        model: Module being trained.
        criterion: Loss callable forwarded to ``update``.
        optimizer: Optimizer forwarded to ``update``.

    Returns:
        NumPy array of shape ``(1,)`` holding the mean of the per-batch losses.

    Raises:
        ValueError: If ``dataloader`` yields no batches (the mean is undefined).
    """
    total = torch.zeros(1, dtype=torch.float32)
    n_batches = 0
    for input, target in dataloader:
        loss = update(input, target, model, criterion, optimizer)
        # Accumulate a detached value so the running sum does not chain
        # together the autograd history of every batch in the epoch.
        total = total + loss.detach()
        n_batches += 1

    if n_batches == 0:
        raise ValueError("dataloader yielded no batches; cannot average the loss")

    return (total / n_batches).cpu().numpy()

def visualize(result):
    """Replace the cell's current output with a line plot of ``result``.

    Args:
        result: Sequence of loss values; plotted against its own index.
    """
    # wait=True delays the clear until the new figure is ready to be shown.
    display.clear_output(wait=True)
    fig, ax = plt.subplots()
    ax.plot(result)
    # Label the figure so it can be read without the surrounding code.
    ax.set(title="Training loss", xlabel="Recorded epoch index", ylabel="Loss")
    plt.show()

def train(n_epochs, dataloader, model, criterion, optimizer, log_interval=10):
    """Train ``model`` for ``n_epochs`` epochs, redrawing the loss curve periodically.

    The loss of the very first epoch (``epoch == 0``) is printed but not
    recorded, so it is neither plotted nor considered for the return value.

    Args:
        n_epochs: Number of passes over ``dataloader``.
        dataloader: Batches forwarded to ``one_epoch``.
        model: Module being trained.
        criterion: Loss callable forwarded to ``one_epoch``.
        optimizer: Optimizer forwarded to ``one_epoch``.
        log_interval: The loss curve is redrawn whenever
            ``epoch % log_interval == 0``.

    Returns:
        The smallest recorded epoch loss, or ``nan`` when no loss was recorded
        (``n_epochs`` <= 1) instead of failing on an empty reduction.
    """
    epoch_loss = []
    for epoch in range(n_epochs):
        loss = one_epoch(dataloader, model, criterion, optimizer)
        print('train_loss:', loss)
        if epoch > 0:
            epoch_loss.append(loss)
        if epoch % log_interval == 0:
            visualize(epoch_loss)

    # np.min raises on an empty list, which happens when at most one epoch ran.
    if not epoch_loss:
        return np.nan
    return np.min(epoch_loss)
In [113]:
# Train the model for 500 epochs, redrawing the loss plot every 50 epochs.
# Recorded note for n_epochs = 500: min_loss = 2532927200.0
train(
    n_epochs=500,
    dataloader=train_dl,
    model=model,
    criterion=criterion,
    optimizer=optimizer,
    log_interval=50,
)
epoch_result tensor([0.])
output :  tensor([[157958.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(292714.8125, grad_fn=<MseLossBackward>)
output :  tensor([[118984.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(9094230., grad_fn=<MseLossBackward>)
output :  tensor([[195134.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(870605.6250, grad_fn=<MseLossBackward>)
output :  tensor([[175495.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2264413.7500, grad_fn=<MseLossBackward>)
output :  tensor([[155584.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0245e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127889.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(12170.5713, grad_fn=<MseLossBackward>)
output :  tensor([[141483.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(233304.0938, grad_fn=<MseLossBackward>)
output :  tensor([[119956.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(915280.8750, grad_fn=<MseLossBackward>)
output :  tensor([[71885.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7917e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165516.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(233394.6719, grad_fn=<MseLossBackward>)
output :  tensor([[138299.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2891434.5000, grad_fn=<MseLossBackward>)
output :  tensor([[226129.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1276335., grad_fn=<MseLossBackward>)
output :  tensor([[169730.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(533082.5000, grad_fn=<MseLossBackward>)
output :  tensor([[250104.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(163771.9688, grad_fn=<MseLossBackward>)
output :  tensor([[55266.5117]], grad_fn=<AddmmBackward>)
loss:  tensor(71028.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164872.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1502e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167399.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(57763324., grad_fn=<MseLossBackward>)
output :  
C:\Users\KIM\anaconda3\lib\site-packages\torch\nn\modules\loss.py:528: UserWarning: Using a target size (torch.Size([1])) that is different to the input size (torch.Size([1, 1])). This will likely lead to incorrect results due to broadcasting. Please ensure they have the same size.
  return F.mse_loss(input, target, reduction=self.reduction)
tensor([[162634.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(37636884., grad_fn=<MseLossBackward>)
output :  tensor([[276178.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1388494., grad_fn=<MseLossBackward>)
output :  tensor([[196752.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(61155.7461, grad_fn=<MseLossBackward>)
output :  tensor([[135613.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6666e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195629.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3064523.7500, grad_fn=<MseLossBackward>)
output :  tensor([[177352.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2608e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153406.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(5789663., grad_fn=<MseLossBackward>)
output :  tensor([[167822.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4742799., grad_fn=<MseLossBackward>)
output :  tensor([[85430.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(907.5156, grad_fn=<MseLossBackward>)
output :  tensor([[168590.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0904e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182777.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4938395., grad_fn=<MseLossBackward>)
output :  tensor([[200936.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9772e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110976.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(952713.2500, grad_fn=<MseLossBackward>)
output :  tensor([[172455.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2117343.2500, grad_fn=<MseLossBackward>)
output :  tensor([[136947.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(200214.2969, grad_fn=<MseLossBackward>)
output :  tensor([[127520.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2188827.7500, grad_fn=<MseLossBackward>)
output :  tensor([[120149.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(421292.2812, grad_fn=<MseLossBackward>)
output :  tensor([[148446.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8888e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169905.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1052e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152716.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(9100309., grad_fn=<MseLossBackward>)
output :  tensor([[181956.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3827097.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142706.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2913742.2500, grad_fn=<MseLossBackward>)
output :  tensor([[106484.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7174e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137161.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0589e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141029.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(36354304., grad_fn=<MseLossBackward>)
output :  tensor([[140113.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7197e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226289.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1661722.3750, grad_fn=<MseLossBackward>)
output :  tensor([[132320.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4992.3057, grad_fn=<MseLossBackward>)
output :  tensor([[151981.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8889622., grad_fn=<MseLossBackward>)
output :  tensor([[116310.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(18576706., grad_fn=<MseLossBackward>)
output :  tensor([[163257.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(10609067., grad_fn=<MseLossBackward>)
output :  tensor([[145571.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4431e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191892.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(11455.6885, grad_fn=<MseLossBackward>)
output :  tensor([[134784.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(111639.5156, grad_fn=<MseLossBackward>)
output :  tensor([[107094.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(8444382., grad_fn=<MseLossBackward>)
output :  tensor([[233669.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(109209.5938, grad_fn=<MseLossBackward>)
output :  tensor([[163019.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5473e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161450.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6004414., grad_fn=<MseLossBackward>)
output :  tensor([[202497.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8901e+10, grad_fn=<MseLossBackward>)
output :  tensor([[240369.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2912e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143404.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(9081.4941, grad_fn=<MseLossBackward>)
output :  tensor([[131417.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6667934.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157439.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5950931.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130656.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(431351.3438, grad_fn=<MseLossBackward>)
output :  tensor([[183256.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8895e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182149.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3804572.2500, grad_fn=<MseLossBackward>)
output :  tensor([[160105.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1944848.1250, grad_fn=<MseLossBackward>)
output :  tensor([[134880.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(65918668., grad_fn=<MseLossBackward>)
output :  tensor([[143168.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(447226.5625, grad_fn=<MseLossBackward>)
output :  tensor([[148809.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(14510624., grad_fn=<MseLossBackward>)
output :  tensor([[171313.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6748e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190659.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9385e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136727.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(51777.5820, grad_fn=<MseLossBackward>)
output :  tensor([[167761.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(17128864., grad_fn=<MseLossBackward>)
output :  tensor([[175523.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(29991196., grad_fn=<MseLossBackward>)
output :  tensor([[114639.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(130039.1250, grad_fn=<MseLossBackward>)
output :  tensor([[222439.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2070945.8750, grad_fn=<MseLossBackward>)
output :  tensor([[186185.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7214428., grad_fn=<MseLossBackward>)
output :  tensor([[125608.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(11756.9971, grad_fn=<MseLossBackward>)
output :  tensor([[198278.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3162284.2500, grad_fn=<MseLossBackward>)
output :  tensor([[177283.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(5682636.5000, grad_fn=<MseLossBackward>)
output :  tensor([[207268.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2035e+10, grad_fn=<MseLossBackward>)
output :  tensor([[206516.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(20103594., grad_fn=<MseLossBackward>)
output :  tensor([[170737.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5791e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195288.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(622126.5625, grad_fn=<MseLossBackward>)
output :  tensor([[113296.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(88139.4062, grad_fn=<MseLossBackward>)
output :  tensor([[114995.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6228456., grad_fn=<MseLossBackward>)
output :  tensor([[112952.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(906899.1250, grad_fn=<MseLossBackward>)
output :  tensor([[147149.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(122128.4062, grad_fn=<MseLossBackward>)
output :  tensor([[158986.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3730e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178702.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1683222.3750, grad_fn=<MseLossBackward>)
output :  tensor([[127433.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(4439.9316, grad_fn=<MseLossBackward>)
output :  tensor([[144057.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(888070.6250, grad_fn=<MseLossBackward>)
output :  tensor([[187579.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7751e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116320.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(335458.1562, grad_fn=<MseLossBackward>)
output :  tensor([[200245.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(10535400., grad_fn=<MseLossBackward>)
output :  tensor([[143563.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2062589.6250, grad_fn=<MseLossBackward>)
output :  tensor([[213778.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(770993.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128242.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5028315.5000, grad_fn=<MseLossBackward>)
output :  tensor([[245748.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6651966.5000, grad_fn=<MseLossBackward>)
output :  tensor([[233342.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6684e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152274.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3575e+08, grad_fn=<MseLossBackward>)
output :  tensor([[84841.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6841e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187404.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6554e+09, grad_fn=<MseLossBackward>)
output :  tensor([[82205.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(1452834.7500, grad_fn=<MseLossBackward>)
output :  tensor([[140036.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(288318.6562, grad_fn=<MseLossBackward>)
output :  tensor([[78030.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6401137., grad_fn=<MseLossBackward>)
output :  tensor([[142010.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(888571.3750, grad_fn=<MseLossBackward>)
output :  tensor([[174924.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1155860.1250, grad_fn=<MseLossBackward>)
output :  tensor([[153048.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(203922.7969, grad_fn=<MseLossBackward>)
output :  tensor([[110059.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7074353., grad_fn=<MseLossBackward>)
output :  tensor([[202778.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2762e+10, grad_fn=<MseLossBackward>)
output :  tensor([[126095.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(5782334., grad_fn=<MseLossBackward>)
output :  tensor([[267523.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5567e+08, grad_fn=<MseLossBackward>)
output :  tensor([[302351.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(58497164., grad_fn=<MseLossBackward>)
output :  tensor([[105608.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3577949.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169145.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(11252461., grad_fn=<MseLossBackward>)
output :  tensor([[133608.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5578e+08, grad_fn=<MseLossBackward>)
output :  tensor([[143607.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(21230496., grad_fn=<MseLossBackward>)
output :  tensor([[128939.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(1716611.7500, grad_fn=<MseLossBackward>)
output :  tensor([[124709.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(84177.0469, grad_fn=<MseLossBackward>)
output :  tensor([[134489.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2445e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225721.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8919e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188398.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3287e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146934.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(9206768., grad_fn=<MseLossBackward>)
output :  tensor([[131186.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(13591550., grad_fn=<MseLossBackward>)
output :  tensor([[115685.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(19676086., grad_fn=<MseLossBackward>)
output :  tensor([[250349.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5848e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135799.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(638550.8125, grad_fn=<MseLossBackward>)
output :  tensor([[206926.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(15414458., grad_fn=<MseLossBackward>)
output :  tensor([[99164.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(32901516., grad_fn=<MseLossBackward>)
output :  tensor([[141151.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1442588.6250, grad_fn=<MseLossBackward>)
output :  tensor([[202055.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0376e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182237.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5465805.5000, grad_fn=<MseLossBackward>)
output :  tensor([[184303.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(485046.9688, grad_fn=<MseLossBackward>)
output :  tensor([[163313.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1225e+10, grad_fn=<MseLossBackward>)
output :  tensor([[293401.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7304e+09, grad_fn=<MseLossBackward>)
output :  tensor([[198369.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(220048.9531, grad_fn=<MseLossBackward>)
output :  tensor([[260875.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0160e+10, grad_fn=<MseLossBackward>)
output :  tensor([[214197.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6835e+09, grad_fn=<MseLossBackward>)
output :  tensor([[273764.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8693e+09, grad_fn=<MseLossBackward>)
output :  tensor([[226216.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4910933., grad_fn=<MseLossBackward>)
output :  tensor([[219651.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9704e+10, grad_fn=<MseLossBackward>)
output :  tensor([[200135.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(9834398., grad_fn=<MseLossBackward>)
output :  tensor([[160387.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8516e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130258.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(5022956.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135865.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(133418.9844, grad_fn=<MseLossBackward>)
output :  tensor([[91454.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(206868.6250, grad_fn=<MseLossBackward>)
output :  tensor([[107557.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(195509.0625, grad_fn=<MseLossBackward>)
output :  tensor([[272516.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1791e+09, grad_fn=<MseLossBackward>)
output :  tensor([[235370.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(137270.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142521.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6144356.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136255.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1548041.3750, grad_fn=<MseLossBackward>)
output :  tensor([[173095.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(405868.5312, grad_fn=<MseLossBackward>)
output :  tensor([[146803.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2414042., grad_fn=<MseLossBackward>)
output :  tensor([[164265.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1412e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165985.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(971579.8750, grad_fn=<MseLossBackward>)
output :  tensor([[139425.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5882368., grad_fn=<MseLossBackward>)
output :  tensor([[191204.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7203e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113762.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(3106709.2500, grad_fn=<MseLossBackward>)
output :  tensor([[168966.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(9202975., grad_fn=<MseLossBackward>)
output :  tensor([[118652.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1814787.8750, grad_fn=<MseLossBackward>)
output :  tensor([[89416.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5838188.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179349.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(422967.3125, grad_fn=<MseLossBackward>)
output :  tensor([[111526.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2646417.2500, grad_fn=<MseLossBackward>)
output :  tensor([[241230.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4977012.5000, grad_fn=<MseLossBackward>)
output :  tensor([[244276.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(523881.9062, grad_fn=<MseLossBackward>)
output :  tensor([[133132.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(13195964., grad_fn=<MseLossBackward>)
output :  tensor([[113169.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(17724494., grad_fn=<MseLossBackward>)
output :  tensor([[286809.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2603e+10, grad_fn=<MseLossBackward>)
output :  tensor([[173804.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5312160.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125320.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(102965.7812, grad_fn=<MseLossBackward>)
output :  tensor([[148114.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0688e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194660.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7402e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141784.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(615268.6250, grad_fn=<MseLossBackward>)
output :  tensor([[156990.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5131e+10, grad_fn=<MseLossBackward>)
output :  tensor([[148544.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(28684894., grad_fn=<MseLossBackward>)
output :  tensor([[129424.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(5680.2129, grad_fn=<MseLossBackward>)
output :  tensor([[240575.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9023e+10, grad_fn=<MseLossBackward>)
output :  tensor([[399561.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(5946892., grad_fn=<MseLossBackward>)
output :  tensor([[103700.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(28080892., grad_fn=<MseLossBackward>)
output :  tensor([[120964.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(6071373., grad_fn=<MseLossBackward>)
output :  tensor([[160200.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(490656.4688, grad_fn=<MseLossBackward>)
output :  tensor([[133710.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1168e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162197.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5763e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173598.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0448e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103867.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(71748.6484, grad_fn=<MseLossBackward>)
output :  tensor([[140912.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(7623.4727, grad_fn=<MseLossBackward>)
output :  tensor([[365293.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4002125.2500, grad_fn=<MseLossBackward>)
output :  tensor([[200833.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8267e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176677.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1385807.2500, grad_fn=<MseLossBackward>)
output :  tensor([[205401.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6258987.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139089.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(8060.6729, grad_fn=<MseLossBackward>)
output :  tensor([[194378.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(14800.2432, grad_fn=<MseLossBackward>)
output :  tensor([[137755.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1541e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182327.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1761302.2500, grad_fn=<MseLossBackward>)
output :  tensor([[236856.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(26455110., grad_fn=<MseLossBackward>)
output :  tensor([[175296.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1681398.5000, grad_fn=<MseLossBackward>)
output :  tensor([[104910.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(9545638., grad_fn=<MseLossBackward>)
output :  tensor([[265138.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(333361.8750, grad_fn=<MseLossBackward>)
output :  tensor([[251674.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2803845.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123220.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(48720.2148, grad_fn=<MseLossBackward>)
output :  tensor([[211883.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9837e+09, grad_fn=<MseLossBackward>)
output :  tensor([[298457.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2050e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208063.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1130434.1250, grad_fn=<MseLossBackward>)
output :  tensor([[212985.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6133e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159182.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1643724.3750, grad_fn=<MseLossBackward>)
output :  tensor([[168013.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3906922.7500, grad_fn=<MseLossBackward>)
output :  tensor([[162253.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(28320358., grad_fn=<MseLossBackward>)
output :  tensor([[167629.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5621048.5000, grad_fn=<MseLossBackward>)
output :  tensor([[233333.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2018e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205850.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5720e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162232.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3202e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123106.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(11299.0254, grad_fn=<MseLossBackward>)
output :  tensor([[177108.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(11738.3682, grad_fn=<MseLossBackward>)
output :  tensor([[179036.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5551e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201609.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7252e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132310.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4499569., grad_fn=<MseLossBackward>)
output :  tensor([[152778.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7212e+08, grad_fn=<MseLossBackward>)
output :  tensor([[275993.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1013986.0625, grad_fn=<MseLossBackward>)
output :  tensor([[87055.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(4225562., grad_fn=<MseLossBackward>)
output :  tensor([[236759.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(67332.1406, grad_fn=<MseLossBackward>)
output :  tensor([[254951.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0757e+11, grad_fn=<MseLossBackward>)
output :  tensor([[169653.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(119921.5234, grad_fn=<MseLossBackward>)
output :  tensor([[190470.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9828e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156317.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1735723.8750, grad_fn=<MseLossBackward>)
output :  tensor([[204373.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3068e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128017.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(965736.1250, grad_fn=<MseLossBackward>)
output :  tensor([[150546.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(30759156., grad_fn=<MseLossBackward>)
output :  tensor([[171664.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5054e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187443.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2540786.2500, grad_fn=<MseLossBackward>)
output :  tensor([[125709.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(84122.6562, grad_fn=<MseLossBackward>)
output :  tensor([[137373.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(763439.0625, grad_fn=<MseLossBackward>)
output :  tensor([[172501.]], grad_fn=<AddmmBackward>)
loss:  tensor(249001., grad_fn=<MseLossBackward>)
output :  tensor([[198404.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6621e+09, grad_fn=<MseLossBackward>)
output :  tensor([[240583.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5840454., grad_fn=<MseLossBackward>)
output :  tensor([[150612.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(19249196., grad_fn=<MseLossBackward>)
output :  tensor([[198780.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7733092., grad_fn=<MseLossBackward>)
output :  tensor([[164392.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1585e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177257.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5030909., grad_fn=<MseLossBackward>)
output :  tensor([[181085.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1404817.5000, grad_fn=<MseLossBackward>)
output :  tensor([[97971.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(944738.4375, grad_fn=<MseLossBackward>)
output :  tensor([[170551.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1979e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134072.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(860314.2500, grad_fn=<MseLossBackward>)
output :  tensor([[122752.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(60095684., grad_fn=<MseLossBackward>)
output :  tensor([[173495.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(254662.1562, grad_fn=<MseLossBackward>)
output :  tensor([[86728.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(2987793.2500, grad_fn=<MseLossBackward>)
output :  tensor([[290387.]], grad_fn=<AddmmBackward>)
loss:  tensor(149769., grad_fn=<MseLossBackward>)
output :  tensor([[167709.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(7339527.5000, grad_fn=<MseLossBackward>)
output :  tensor([[190307.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0409e+10, grad_fn=<MseLossBackward>)
output :  tensor([[239877.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6858e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149256.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3040173.7500, grad_fn=<MseLossBackward>)
output :  tensor([[121003.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8979949., grad_fn=<MseLossBackward>)
output :  tensor([[121750.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3422789., grad_fn=<MseLossBackward>)
output :  tensor([[144139.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4909e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173473.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(276774.6250, grad_fn=<MseLossBackward>)
output :  tensor([[113643.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6994e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204470.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2889e+10, grad_fn=<MseLossBackward>)
output :  tensor([[246174.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(21853434., grad_fn=<MseLossBackward>)
output :  tensor([[247168.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1911e+10, grad_fn=<MseLossBackward>)
output :  tensor([[218514.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1967e+08, grad_fn=<MseLossBackward>)
output :  tensor([[191862.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5286e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187430.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4858.5254, grad_fn=<MseLossBackward>)
output :  tensor([[205088.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8304e+10, grad_fn=<MseLossBackward>)
output :  tensor([[185350.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2695e+10, grad_fn=<MseLossBackward>)
output :  tensor([[175934.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7873022., grad_fn=<MseLossBackward>)
output :  tensor([[149685.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5358574., grad_fn=<MseLossBackward>)
output :  tensor([[336235.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(584699.1875, grad_fn=<MseLossBackward>)
output :  tensor([[208152.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(14806743., grad_fn=<MseLossBackward>)
output :  tensor([[162985.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(8912744., grad_fn=<MseLossBackward>)
output :  tensor([[182031.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5365e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105321.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(103066.0781, grad_fn=<MseLossBackward>)
output :  tensor([[269236.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1661e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171018.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(8305113.5000, grad_fn=<MseLossBackward>)
output :  tensor([[212629.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(757498.2500, grad_fn=<MseLossBackward>)
output :  tensor([[200534.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1884e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180164.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(930230.1250, grad_fn=<MseLossBackward>)
output :  tensor([[201273.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(277399.7188, grad_fn=<MseLossBackward>)
output :  tensor([[155115.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(13343.8594, grad_fn=<MseLossBackward>)
output :  tensor([[153939.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9095e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120842.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5486501., grad_fn=<MseLossBackward>)
output :  tensor([[141802.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3250696.2500, grad_fn=<MseLossBackward>)
output :  tensor([[149531.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(282824.5312, grad_fn=<MseLossBackward>)
output :  tensor([[202457.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5761e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161118.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2619188.2500, grad_fn=<MseLossBackward>)
output :  tensor([[103507.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(16059054., grad_fn=<MseLossBackward>)
output :  tensor([[223910.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5887e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186599.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4520e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174279.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4862645., grad_fn=<MseLossBackward>)
output :  tensor([[81426.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(328857.4375, grad_fn=<MseLossBackward>)
output :  tensor([[131220.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(7400780., grad_fn=<MseLossBackward>)
output :  tensor([[216255.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5087491.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143718.]], grad_fn=<AddmmBackward>)
loss:  tensor(79524., grad_fn=<MseLossBackward>)
output :  tensor([[132029.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4120138.7500, grad_fn=<MseLossBackward>)
output :  tensor([[145104.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6272990., grad_fn=<MseLossBackward>)
output :  tensor([[179287.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7462e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144868.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(753478.2500, grad_fn=<MseLossBackward>)
output :  tensor([[160022.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(528.2815, grad_fn=<MseLossBackward>)
output :  tensor([[214089.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(829038.6875, grad_fn=<MseLossBackward>)
output :  tensor([[138982.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1548e+09, grad_fn=<MseLossBackward>)
output :  tensor([[258462.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(11990205., grad_fn=<MseLossBackward>)
output :  tensor([[158084.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2004392.2500, grad_fn=<MseLossBackward>)
output :  tensor([[130199.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2887503.7500, grad_fn=<MseLossBackward>)
output :  tensor([[94661.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(114651.0156, grad_fn=<MseLossBackward>)
output :  tensor([[155937.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1033e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181392.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2227509.5000, grad_fn=<MseLossBackward>)
output :  tensor([[118365.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4554823., grad_fn=<MseLossBackward>)
output :  tensor([[186096.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8364e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145145.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3093e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150611.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(505787.6562, grad_fn=<MseLossBackward>)
output :  tensor([[188659.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(826764., grad_fn=<MseLossBackward>)
output :  tensor([[251358.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7404e+09, grad_fn=<MseLossBackward>)
output :  tensor([[90599.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(811618., grad_fn=<MseLossBackward>)
output :  tensor([[240049.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2456.4414, grad_fn=<MseLossBackward>)
output :  tensor([[128526.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(708.0588, grad_fn=<MseLossBackward>)
output :  tensor([[165282.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0124e+10, grad_fn=<MseLossBackward>)
output :  tensor([[114515.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1069e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175574.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(181369.5156, grad_fn=<MseLossBackward>)
output :  tensor([[165113.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6116e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155619.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3097e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236027.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8834827., grad_fn=<MseLossBackward>)
output :  tensor([[229728.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9926e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125427.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(2472731.7500, grad_fn=<MseLossBackward>)
output :  tensor([[124704.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1678198.7500, grad_fn=<MseLossBackward>)
output :  tensor([[221828.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(26739402., grad_fn=<MseLossBackward>)
output :  tensor([[226697.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(53323312., grad_fn=<MseLossBackward>)
output :  tensor([[227831.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1279903.3750, grad_fn=<MseLossBackward>)
output :  tensor([[149597.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2551507., grad_fn=<MseLossBackward>)
output :  tensor([[210256.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(66040.9688, grad_fn=<MseLossBackward>)
output :  tensor([[131998.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4395e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131789.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(505010.0938, grad_fn=<MseLossBackward>)
output :  tensor([[306005.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(80905528., grad_fn=<MseLossBackward>)
output :  tensor([[137568.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(11772833., grad_fn=<MseLossBackward>)
output :  tensor([[120566.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8694e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106064.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(11805291., grad_fn=<MseLossBackward>)
output :  tensor([[153342.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6701e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179896.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9925e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176300.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(10892166., grad_fn=<MseLossBackward>)
output :  tensor([[189293.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3705e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96938.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(9371539., grad_fn=<MseLossBackward>)
output :  tensor([[176470.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6399398., grad_fn=<MseLossBackward>)
output :  tensor([[170565.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7105306.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139984.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(969147.9375, grad_fn=<MseLossBackward>)
output :  tensor([[259133.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9933e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142511.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3075e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173599.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(359737.5625, grad_fn=<MseLossBackward>)
output :  tensor([[139768.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(53462.1094, grad_fn=<MseLossBackward>)
output :  tensor([[194944.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(30860976., grad_fn=<MseLossBackward>)
output :  tensor([[168022.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3911989.5000, grad_fn=<MseLossBackward>)
output :  tensor([[240642.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(11271652., grad_fn=<MseLossBackward>)
output :  tensor([[134164.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(112486.8750, grad_fn=<MseLossBackward>)
output :  tensor([[150957.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2584207., grad_fn=<MseLossBackward>)
output :  tensor([[211539.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(11974087., grad_fn=<MseLossBackward>)
output :  tensor([[165837.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(701877.4375, grad_fn=<MseLossBackward>)
output :  tensor([[191447.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(5990256., grad_fn=<MseLossBackward>)
output :  tensor([[133915.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2925e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128231.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(590436.1875, grad_fn=<MseLossBackward>)
output :  tensor([[138827.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1375599.1250, grad_fn=<MseLossBackward>)
output :  tensor([[196065.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3927e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164450.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4453e+09, grad_fn=<MseLossBackward>)
output :  tensor([[77314.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9981e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91969.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(55794832., grad_fn=<MseLossBackward>)
output :  tensor([[258487.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(26981370., grad_fn=<MseLossBackward>)
output :  tensor([[201830.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9477e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115002.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0943, grad_fn=<MseLossBackward>)
output :  tensor([[155638.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0152e+09, grad_fn=<MseLossBackward>)
output :  tensor([[204489.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4058e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178344.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4007e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155569.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(323814.3438, grad_fn=<MseLossBackward>)
output :  tensor([[171159.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1344295.3750, grad_fn=<MseLossBackward>)
output :  tensor([[118381.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(11437607., grad_fn=<MseLossBackward>)
output :  tensor([[163270.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(68398848., grad_fn=<MseLossBackward>)
output :  tensor([[192260.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1432e+08, grad_fn=<MseLossBackward>)
output :  tensor([[218598.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(813124.8750, grad_fn=<MseLossBackward>)
output :  tensor([[244844.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5016e+11, grad_fn=<MseLossBackward>)
output :  tensor([[148403.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1970908.8750, grad_fn=<MseLossBackward>)
output :  tensor([[110531.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(4209710., grad_fn=<MseLossBackward>)
output :  tensor([[170474.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3054e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150666.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(27842.0508, grad_fn=<MseLossBackward>)
output :  tensor([[235239.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3098150., grad_fn=<MseLossBackward>)
output :  tensor([[115503.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(253732.5781, grad_fn=<MseLossBackward>)
output :  tensor([[183845.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(894620.3750, grad_fn=<MseLossBackward>)
output :  tensor([[184598.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4416827.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162188.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4904e+10, grad_fn=<MseLossBackward>)
output :  tensor([[96554.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4195e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239361.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(130840.4531, grad_fn=<MseLossBackward>)
output :  tensor([[177036.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1074008.3750, grad_fn=<MseLossBackward>)
output :  tensor([[138558.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2077561.8750, grad_fn=<MseLossBackward>)
output :  tensor([[233109.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3573163.2500, grad_fn=<MseLossBackward>)
output :  tensor([[164735.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3013587.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198508.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6000e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134555.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(197149.8750, grad_fn=<MseLossBackward>)
output :  tensor([[185243.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4027e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137316.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1734406.7500, grad_fn=<MseLossBackward>)
output :  tensor([[221810.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0135e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221500.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1222e+08, grad_fn=<MseLossBackward>)
output :  tensor([[88516.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(2199451.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158684.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(561539.5000, grad_fn=<MseLossBackward>)
output :  tensor([[242355.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6518e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145914.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(837196.4375, grad_fn=<MseLossBackward>)
output :  tensor([[111387.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9702e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163974.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(276215.9375, grad_fn=<MseLossBackward>)
output :  tensor([[141752.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(5051818., grad_fn=<MseLossBackward>)
output :  tensor([[127637.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(315958.1562, grad_fn=<MseLossBackward>)
output :  tensor([[188728.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9380e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123700.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(1440506.2500, grad_fn=<MseLossBackward>)
output :  tensor([[151524.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(226100.2500, grad_fn=<MseLossBackward>)
output :  tensor([[168859.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(8355261., grad_fn=<MseLossBackward>)
output :  tensor([[152381.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1908412.7500, grad_fn=<MseLossBackward>)
output :  tensor([[157948.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(24515340., grad_fn=<MseLossBackward>)
output :  tensor([[135463.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0032e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131966.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1090.0315, grad_fn=<MseLossBackward>)
output :  tensor([[157309.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3524e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144100.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2613.7656, grad_fn=<MseLossBackward>)
output :  tensor([[161801.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2689.3948, grad_fn=<MseLossBackward>)
output :  tensor([[143806.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1496e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149354.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(307938.2812, grad_fn=<MseLossBackward>)
output :  tensor([[184679.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(11027899., grad_fn=<MseLossBackward>)
output :  tensor([[170000.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1001438., grad_fn=<MseLossBackward>)
output :  tensor([[177917.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4335505., grad_fn=<MseLossBackward>)
output :  tensor([[220966.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(933820.2500, grad_fn=<MseLossBackward>)
output :  tensor([[114336.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(41431148., grad_fn=<MseLossBackward>)
output :  tensor([[141652.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8063e+08, grad_fn=<MseLossBackward>)
output :  tensor([[284023.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3905811., grad_fn=<MseLossBackward>)
output :  tensor([[114959.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1083616., grad_fn=<MseLossBackward>)
output :  tensor([[177807.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7802e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186372.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1884056.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172791.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6151e+08, grad_fn=<MseLossBackward>)
output :  tensor([[252340.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1345e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222337.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(114212.3125, grad_fn=<MseLossBackward>)
output :  tensor([[135787.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9324e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177515.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0099e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122596.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1971084.3750, grad_fn=<MseLossBackward>)
output :  tensor([[181303.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6294e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153822.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(676686.1875, grad_fn=<MseLossBackward>)
output :  tensor([[157348.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1768e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204012.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5233085., grad_fn=<MseLossBackward>)
output :  tensor([[144562.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4551e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175952.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2301.0010, grad_fn=<MseLossBackward>)
output :  tensor([[247693.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0116e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148692.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(480054.1250, grad_fn=<MseLossBackward>)
output :  tensor([[201074.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2529441.7500, grad_fn=<MseLossBackward>)
output :  tensor([[154714.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(27406534., grad_fn=<MseLossBackward>)
output :  tensor([[128584.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6471e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135472.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(77257.9375, grad_fn=<MseLossBackward>)
output :  tensor([[179606.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(19301744., grad_fn=<MseLossBackward>)
output :  tensor([[192797.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7824695., grad_fn=<MseLossBackward>)
output :  tensor([[215680.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3757e+09, grad_fn=<MseLossBackward>)
output :  tensor([[255521.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2187210., grad_fn=<MseLossBackward>)
output :  tensor([[176030.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0440e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145491.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9151e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137928.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(43183380., grad_fn=<MseLossBackward>)
output :  tensor([[72574.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0611e+09, grad_fn=<MseLossBackward>)
output :  tensor([[132959.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4162875., grad_fn=<MseLossBackward>)
output :  tensor([[130070.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1370180., grad_fn=<MseLossBackward>)
output :  tensor([[157196.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(10215515., grad_fn=<MseLossBackward>)
output :  tensor([[129309.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(5334331.5000, grad_fn=<MseLossBackward>)
output :  tensor([[77319.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(671938.8125, grad_fn=<MseLossBackward>)
output :  tensor([[84116.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(4479407., grad_fn=<MseLossBackward>)
output :  tensor([[220864.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2401e+08, grad_fn=<MseLossBackward>)
output :  tensor([[142022.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7159e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130981.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(231391.0625, grad_fn=<MseLossBackward>)
output :  tensor([[168439.]], grad_fn=<AddmmBackward>)
loss:  tensor(2070721., grad_fn=<MseLossBackward>)
output :  tensor([[235853.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(728462.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188512.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(13156603., grad_fn=<MseLossBackward>)
output :  tensor([[162126.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(37538404., grad_fn=<MseLossBackward>)
output :  tensor([[199696.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3225672.2500, grad_fn=<MseLossBackward>)
output :  tensor([[198332.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4952e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137000.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(0.2659, grad_fn=<MseLossBackward>)
output :  tensor([[154002.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(995567.4375, grad_fn=<MseLossBackward>)
output :  tensor([[135579.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(176846.5312, grad_fn=<MseLossBackward>)
output :  tensor([[196758.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1050e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152330.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2787699.7500, grad_fn=<MseLossBackward>)
output :  tensor([[139332.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1006e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146639.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3024229.7500, grad_fn=<MseLossBackward>)
output :  tensor([[206873.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(26276516., grad_fn=<MseLossBackward>)
output :  tensor([[104959.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2714e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167098.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(161315.1875, grad_fn=<MseLossBackward>)
output :  tensor([[128915.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(838111.6250, grad_fn=<MseLossBackward>)
output :  tensor([[146436.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(318078.3750, grad_fn=<MseLossBackward>)
output :  tensor([[105021.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8180e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141341.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(14759523., grad_fn=<MseLossBackward>)
output :  tensor([[228781.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(52113508., grad_fn=<MseLossBackward>)
output :  tensor([[145892.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(796639.9375, grad_fn=<MseLossBackward>)
output :  tensor([[141001.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(12261378., grad_fn=<MseLossBackward>)
output :  tensor([[168573.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6462e+09, grad_fn=<MseLossBackward>)
output :  tensor([[260704.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9913e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173808.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1420119.1250, grad_fn=<MseLossBackward>)
output :  tensor([[103748.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(946333.7500, grad_fn=<MseLossBackward>)
output :  tensor([[198202.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2881e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159986.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(973182.2500, grad_fn=<MseLossBackward>)
output :  tensor([[161478.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6633e+10, grad_fn=<MseLossBackward>)
output :  tensor([[100520.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(4931765.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121572.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(4111991.7500, grad_fn=<MseLossBackward>)
output :  tensor([[158038.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4155291.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142734.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(7477063., grad_fn=<MseLossBackward>)
output :  tensor([[201652.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2731634.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143446.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2091819.8750, grad_fn=<MseLossBackward>)
output :  tensor([[260875.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1971259.8750, grad_fn=<MseLossBackward>)
output :  tensor([[128805.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2820e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162035.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(12002002., grad_fn=<MseLossBackward>)
output :  tensor([[187463.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1073878.8750, grad_fn=<MseLossBackward>)
output :  tensor([[122817.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6428e+08, grad_fn=<MseLossBackward>)
output :  tensor([[246531.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(12028650., grad_fn=<MseLossBackward>)
output :  tensor([[155746.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7676e+08, grad_fn=<MseLossBackward>)
output :  tensor([[245385.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1232.6682, grad_fn=<MseLossBackward>)
output :  tensor([[146184.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4771494., grad_fn=<MseLossBackward>)
output :  tensor([[211927.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3715738.2500, grad_fn=<MseLossBackward>)
output :  tensor([[175610.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(10309819., grad_fn=<MseLossBackward>)
output :  tensor([[154334.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(111952.9766, grad_fn=<MseLossBackward>)
output :  tensor([[117444.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(308667.0625, grad_fn=<MseLossBackward>)
output :  tensor([[232801.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9473e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236125.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(15008966., grad_fn=<MseLossBackward>)
output :  tensor([[149013.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(18689816., grad_fn=<MseLossBackward>)
output :  tensor([[254029.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(757171.8750, grad_fn=<MseLossBackward>)
output :  tensor([[120906.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(40990404., grad_fn=<MseLossBackward>)
output :  tensor([[177759.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3095455.2500, grad_fn=<MseLossBackward>)
output :  tensor([[164381.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(19200554., grad_fn=<MseLossBackward>)
output :  tensor([[132663.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2765621., grad_fn=<MseLossBackward>)
output :  tensor([[197940.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6840e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164714.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(510599.5625, grad_fn=<MseLossBackward>)
output :  tensor([[167020.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(16162284., grad_fn=<MseLossBackward>)
output :  tensor([[157440.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(313477.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147929.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3883609.2500, grad_fn=<MseLossBackward>)
output :  tensor([[173601.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1090e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160977.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(955811.7500, grad_fn=<MseLossBackward>)
output :  tensor([[371872.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4635e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128853.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(3434159.2500, grad_fn=<MseLossBackward>)
output :  tensor([[130756.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0481e+09, grad_fn=<MseLossBackward>)
output :  tensor([[278855.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5559427., grad_fn=<MseLossBackward>)
output :  tensor([[158678.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(11033193., grad_fn=<MseLossBackward>)
output :  tensor([[134375.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9253e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226228.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(33307688., grad_fn=<MseLossBackward>)
output :  tensor([[181308.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(653798.5625, grad_fn=<MseLossBackward>)
output :  tensor([[156614.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(21293610., grad_fn=<MseLossBackward>)
output :  tensor([[143999.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1001250.3750, grad_fn=<MseLossBackward>)
output :  tensor([[156043.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6648e+08, grad_fn=<MseLossBackward>)
output :  tensor([[102069.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(4284221., grad_fn=<MseLossBackward>)
output :  tensor([[84057.]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7874e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163283.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2945835.7500, grad_fn=<MseLossBackward>)
output :  tensor([[186538.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7190e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159616.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2612011.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153215.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(18353594., grad_fn=<MseLossBackward>)
output :  tensor([[136708.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(549590.5625, grad_fn=<MseLossBackward>)
output :  tensor([[207437.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2213446.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137417.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(339634., grad_fn=<MseLossBackward>)
output :  tensor([[182257.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6318e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149677.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(13526190., grad_fn=<MseLossBackward>)
output :  tensor([[110771.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7125e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96110.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4455859., grad_fn=<MseLossBackward>)
output :  tensor([[172433.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6589248.5000, grad_fn=<MseLossBackward>)
output :  tensor([[267593.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(51742396., grad_fn=<MseLossBackward>)
output :  tensor([[140701.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(636828.9375, grad_fn=<MseLossBackward>)
output :  tensor([[156940.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(8726578., grad_fn=<MseLossBackward>)
output :  tensor([[132733.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(54442.0156, grad_fn=<MseLossBackward>)
output :  tensor([[150074.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(330481.2500, grad_fn=<MseLossBackward>)
output :  tensor([[167028.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(758695.4375, grad_fn=<MseLossBackward>)
output :  tensor([[128074.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(1153526.3750, grad_fn=<MseLossBackward>)
output :  tensor([[175998.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6089e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157270.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(73060.3984, grad_fn=<MseLossBackward>)
output :  tensor([[117388.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(789043.5625, grad_fn=<MseLossBackward>)
output :  tensor([[158362.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5708e+09, grad_fn=<MseLossBackward>)
output :  tensor([[52529.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(279874.0625, grad_fn=<MseLossBackward>)
output :  tensor([[232473.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4042e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200453.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(298389.0625, grad_fn=<MseLossBackward>)
output :  tensor([[182612.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5701126., grad_fn=<MseLossBackward>)
output :  tensor([[105769.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(53007.8672, grad_fn=<MseLossBackward>)
output :  tensor([[86003.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(992545.1875, grad_fn=<MseLossBackward>)
output :  tensor([[135046.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(24535924., grad_fn=<MseLossBackward>)
output :  tensor([[217568.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8417e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199388.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(65795672., grad_fn=<MseLossBackward>)
output :  tensor([[171418.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(41201956., grad_fn=<MseLossBackward>)
output :  tensor([[170527.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9250e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192586.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6691518., grad_fn=<MseLossBackward>)
output :  tensor([[86061.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(881046.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138923.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1159457.8750, grad_fn=<MseLossBackward>)
output :  tensor([[112010.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2280855., grad_fn=<MseLossBackward>)
output :  tensor([[149775.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9087e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173185.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7796e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193266.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3767e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179273.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(527688.7500, grad_fn=<MseLossBackward>)
output :  tensor([[98191.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2861753.7500, grad_fn=<MseLossBackward>)
output :  tensor([[116558.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(886922.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160187.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6702e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198385.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2605197.7500, grad_fn=<MseLossBackward>)
output :  tensor([[146405.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5784626.5000, grad_fn=<MseLossBackward>)
train_loss: [2.693969e+09]
epoch_result tensor([0.])
output :  tensor([[159683.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1400968.1250, grad_fn=<MseLossBackward>)
output :  tensor([[120606.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1941276.1250, grad_fn=<MseLossBackward>)
output :  tensor([[196061.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3463204.7500, grad_fn=<MseLossBackward>)
output :  tensor([[178391.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1935272.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155801.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9278e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130912.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(8484113., grad_fn=<MseLossBackward>)
output :  tensor([[140152.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(717885.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117711.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(1661259.1250, grad_fn=<MseLossBackward>)
output :  tensor([[70952.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5508e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166882.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(778447.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142137.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4570643., grad_fn=<MseLossBackward>)
output :  tensor([[224556.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(197122.1250, grad_fn=<MseLossBackward>)
output :  tensor([[168893.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(11285.7422, grad_fn=<MseLossBackward>)
output :  tensor([[245774.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(15407956., grad_fn=<MseLossBackward>)
output :  tensor([[52868.3867]], grad_fn=<AddmmBackward>)
loss:  tensor(4543775., grad_fn=<MseLossBackward>)
output :  tensor([[163769.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7131e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174715.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(81055.8672, grad_fn=<MseLossBackward>)
output :  tensor([[148797.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(59327304., grad_fn=<MseLossBackward>)
output :  tensor([[270583.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(19506852., grad_fn=<MseLossBackward>)
output :  tensor([[196485.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(264437., grad_fn=<MseLossBackward>)
output :  tensor([[138050.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5322e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193372.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(256289.0625, grad_fn=<MseLossBackward>)
output :  tensor([[178633.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1406e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152915.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3670098., grad_fn=<MseLossBackward>)
output :  tensor([[175272.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(27800410., grad_fn=<MseLossBackward>)
output :  tensor([[85201.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(39259.7070, grad_fn=<MseLossBackward>)
output :  tensor([[171328.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4022e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186204.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1451987.3750, grad_fn=<MseLossBackward>)
output :  tensor([[202322.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8279e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109870.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(16764.1797, grad_fn=<MseLossBackward>)
output :  tensor([[169415.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2511333.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135765.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(539536.1875, grad_fn=<MseLossBackward>)
output :  tensor([[129900.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(810801.7500, grad_fn=<MseLossBackward>)
output :  tensor([[121182.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2831332., grad_fn=<MseLossBackward>)
output :  tensor([[147097.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0586e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172055.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0433e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150819.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1252895.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179421.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(334210.4375, grad_fn=<MseLossBackward>)
output :  tensor([[140716.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(80186.3125, grad_fn=<MseLossBackward>)
output :  tensor([[104408.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0760e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135640.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2980e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136990.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3962028., grad_fn=<MseLossBackward>)
output :  tensor([[139836.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6478e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222204.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7812986., grad_fn=<MseLossBackward>)
output :  tensor([[135570.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(11025513., grad_fn=<MseLossBackward>)
output :  tensor([[149812.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(660816.5625, grad_fn=<MseLossBackward>)
output :  tensor([[112638.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(407702.2188, grad_fn=<MseLossBackward>)
output :  tensor([[160321.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(103241.7188, grad_fn=<MseLossBackward>)
output :  tensor([[144388.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5615e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196515.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(20393974., grad_fn=<MseLossBackward>)
output :  tensor([[134485.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1241.4612, grad_fn=<MseLossBackward>)
output :  tensor([[117945.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(63132708., grad_fn=<MseLossBackward>)
output :  tensor([[233339.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(435950.6875, grad_fn=<MseLossBackward>)
output :  tensor([[165146.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3371e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151263.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(59856576., grad_fn=<MseLossBackward>)
output :  tensor([[204332.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8280e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243097.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2299e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147652.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(17241828., grad_fn=<MseLossBackward>)
output :  tensor([[143254.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(85646056., grad_fn=<MseLossBackward>)
output :  tensor([[154200.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(638875.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131150.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1324585.2500, grad_fn=<MseLossBackward>)
output :  tensor([[184115.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7585e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183070.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1059034., grad_fn=<MseLossBackward>)
output :  tensor([[161332.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(27920.3203, grad_fn=<MseLossBackward>)
output :  tensor([[144857.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3449725.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142898.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(158466.1875, grad_fn=<MseLossBackward>)
output :  tensor([[143168.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3355708.7500, grad_fn=<MseLossBackward>)
output :  tensor([[172108.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5667e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194946.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8634e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136289.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(44231.3477, grad_fn=<MseLossBackward>)
output :  tensor([[176214.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(18613292., grad_fn=<MseLossBackward>)
output :  tensor([[176281.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(22261736., grad_fn=<MseLossBackward>)
output :  tensor([[115849.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(721995.3750, grad_fn=<MseLossBackward>)
output :  tensor([[217282.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(13820968., grad_fn=<MseLossBackward>)
output :  tensor([[181882.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2614891.2500, grad_fn=<MseLossBackward>)
output :  tensor([[127737.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(5005532.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194141.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5564217.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172396.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6267512., grad_fn=<MseLossBackward>)
output :  tensor([[207682.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1886e+10, grad_fn=<MseLossBackward>)
output :  tensor([[208004.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(8970774., grad_fn=<MseLossBackward>)
output :  tensor([[171750.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6606e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195311.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(658912.6875, grad_fn=<MseLossBackward>)
output :  tensor([[110691.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(5329280.5000, grad_fn=<MseLossBackward>)
output :  tensor([[115488.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8931506., grad_fn=<MseLossBackward>)
output :  tensor([[113576.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2486189.7500, grad_fn=<MseLossBackward>)
output :  tensor([[148288.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2215027.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162140.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2581e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178992.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1014489.6250, grad_fn=<MseLossBackward>)
output :  tensor([[131270.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(14218084., grad_fn=<MseLossBackward>)
output :  tensor([[148014.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(9089471., grad_fn=<MseLossBackward>)
output :  tensor([[184242.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4347e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119222.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5393498., grad_fn=<MseLossBackward>)
output :  tensor([[202031.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(25316778., grad_fn=<MseLossBackward>)
output :  tensor([[145710.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(505210., grad_fn=<MseLossBackward>)
output :  tensor([[207015.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(34626052., grad_fn=<MseLossBackward>)
output :  tensor([[125894.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(11151.6904, grad_fn=<MseLossBackward>)
output :  tensor([[246149.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4746475., grad_fn=<MseLossBackward>)
output :  tensor([[235099.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4901e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154419.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2988e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85151.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8328e+08, grad_fn=<MseLossBackward>)
output :  tensor([[190805.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0719e+09, grad_fn=<MseLossBackward>)
output :  tensor([[79847.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(1327806.1250, grad_fn=<MseLossBackward>)
output :  tensor([[140677.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1385512.8750, grad_fn=<MseLossBackward>)
output :  tensor([[76373.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(762401.8125, grad_fn=<MseLossBackward>)
output :  tensor([[147011.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(16472564., grad_fn=<MseLossBackward>)
output :  tensor([[177551.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2405795., grad_fn=<MseLossBackward>)
output :  tensor([[155732.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4984196., grad_fn=<MseLossBackward>)
output :  tensor([[108797.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1954054.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202376.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2853e+10, grad_fn=<MseLossBackward>)
output :  tensor([[129017.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(268202.5938, grad_fn=<MseLossBackward>)
output :  tensor([[268698.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2771e+08, grad_fn=<MseLossBackward>)
output :  tensor([[304242.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(33152764., grad_fn=<MseLossBackward>)
output :  tensor([[107463.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1360.9182, grad_fn=<MseLossBackward>)
output :  tensor([[174451.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3809084., grad_fn=<MseLossBackward>)
output :  tensor([[134333.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9347e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137419.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2497239.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130519.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(72626.0391, grad_fn=<MseLossBackward>)
output :  tensor([[126849.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(3419639., grad_fn=<MseLossBackward>)
output :  tensor([[137531.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8578e+08, grad_fn=<MseLossBackward>)
output :  tensor([[229688.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7369e+10, grad_fn=<MseLossBackward>)
output :  tensor([[184521.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4486e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144527.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(393540.5625, grad_fn=<MseLossBackward>)
output :  tensor([[131159.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(13392512., grad_fn=<MseLossBackward>)
output :  tensor([[112689.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2071485.5000, grad_fn=<MseLossBackward>)
output :  tensor([[251470.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4343e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136548.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2398239.5000, grad_fn=<MseLossBackward>)
output :  tensor([[205719.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7395680., grad_fn=<MseLossBackward>)
output :  tensor([[106079.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1391367.7500, grad_fn=<MseLossBackward>)
output :  tensor([[139285.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(441497.9688, grad_fn=<MseLossBackward>)
output :  tensor([[206919.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0908e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181050.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1322823.5000, grad_fn=<MseLossBackward>)
output :  tensor([[188132.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9810011., grad_fn=<MseLossBackward>)
output :  tensor([[163658.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1124e+10, grad_fn=<MseLossBackward>)
output :  tensor([[295893.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5294e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197908.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(74.3906, grad_fn=<MseLossBackward>)
output :  tensor([[264061.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9265e+10, grad_fn=<MseLossBackward>)
output :  tensor([[213251.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7824e+09, grad_fn=<MseLossBackward>)
output :  tensor([[274455.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8100e+09, grad_fn=<MseLossBackward>)
output :  tensor([[222719.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1640280.5000, grad_fn=<MseLossBackward>)
output :  tensor([[223259.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8473e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194060.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(8639191., grad_fn=<MseLossBackward>)
output :  tensor([[160729.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0067e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133852.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1828453.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132317.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(10126218., grad_fn=<MseLossBackward>)
output :  tensor([[90599.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(160293.8906, grad_fn=<MseLossBackward>)
output :  tensor([[107207.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(627821., grad_fn=<MseLossBackward>)
output :  tensor([[271842.]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2556e+09, grad_fn=<MseLossBackward>)
output :  tensor([[231593.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(11605307., grad_fn=<MseLossBackward>)
output :  tensor([[147531.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6406119., grad_fn=<MseLossBackward>)
output :  tensor([[138910.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1988981.3750, grad_fn=<MseLossBackward>)
output :  tensor([[174852.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1253070.3750, grad_fn=<MseLossBackward>)
output :  tensor([[147639.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5711652., grad_fn=<MseLossBackward>)
output :  tensor([[163285.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7436e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164223.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(602394.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134649.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5523675., grad_fn=<MseLossBackward>)
output :  tensor([[194685.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2107e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113858.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(3453528.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175404.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(11588067., grad_fn=<MseLossBackward>)
output :  tensor([[120413.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(171163.2031, grad_fn=<MseLossBackward>)
output :  tensor([[87480.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(230985.3750, grad_fn=<MseLossBackward>)
output :  tensor([[178849.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1323794.1250, grad_fn=<MseLossBackward>)
output :  tensor([[109544.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(126335.8125, grad_fn=<MseLossBackward>)
output :  tensor([[240292.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1670031.2500, grad_fn=<MseLossBackward>)
output :  tensor([[250530.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(30585566., grad_fn=<MseLossBackward>)
output :  tensor([[127248.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(5069217., grad_fn=<MseLossBackward>)
output :  tensor([[107127.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(3354306.5000, grad_fn=<MseLossBackward>)
output :  tensor([[286445.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2713e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170418.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1170385.8750, grad_fn=<MseLossBackward>)
output :  tensor([[122414.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6686103., grad_fn=<MseLossBackward>)
output :  tensor([[147454.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6758e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198330.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4552e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140557.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(196235.1562, grad_fn=<MseLossBackward>)
output :  tensor([[156744.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5192e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150825.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(9455529., grad_fn=<MseLossBackward>)
output :  tensor([[131827.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(5418784., grad_fn=<MseLossBackward>)
output :  tensor([[240665.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8998e+10, grad_fn=<MseLossBackward>)
output :  tensor([[399082.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8511442., grad_fn=<MseLossBackward>)
output :  tensor([[105157.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(14764806., grad_fn=<MseLossBackward>)
output :  tensor([[111133.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(54263252., grad_fn=<MseLossBackward>)
output :  tensor([[156749.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7566539.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135325.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4873e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162370.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5557e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176393.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4080e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105974.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5638547., grad_fn=<MseLossBackward>)
output :  tensor([[143109.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4450583.5000, grad_fn=<MseLossBackward>)
output :  tensor([[361511.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(33440920., grad_fn=<MseLossBackward>)
output :  tensor([[200866.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8232e+09, grad_fn=<MseLossBackward>)
output :  tensor([[177268.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3128808.2500, grad_fn=<MseLossBackward>)
output :  tensor([[201133.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3121626.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139909.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(827645.0625, grad_fn=<MseLossBackward>)
output :  tensor([[194610.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(12182.6406, grad_fn=<MseLossBackward>)
output :  tensor([[138038.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3262e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182638.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2685348., grad_fn=<MseLossBackward>)
output :  tensor([[241798.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(40665.2422, grad_fn=<MseLossBackward>)
output :  tensor([[174264.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(69778.5234, grad_fn=<MseLossBackward>)
output :  tensor([[107978.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(449.2413, grad_fn=<MseLossBackward>)
output :  tensor([[264577.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(274.3164, grad_fn=<MseLossBackward>)
output :  tensor([[252426.]], grad_fn=<AddmmBackward>)
loss:  tensor(5885476., grad_fn=<MseLossBackward>)
output :  tensor([[122561.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(191885.0625, grad_fn=<MseLossBackward>)
output :  tensor([[212246.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9381e+09, grad_fn=<MseLossBackward>)
output :  tensor([[303232.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8699e+08, grad_fn=<MseLossBackward>)
output :  tensor([[210543.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(12553513., grad_fn=<MseLossBackward>)
output :  tensor([[210616.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6740e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157605.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(86877.5625, grad_fn=<MseLossBackward>)
output :  tensor([[170869.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(773685.1875, grad_fn=<MseLossBackward>)
output :  tensor([[159195.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5124635., grad_fn=<MseLossBackward>)
output :  tensor([[173720.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(13844329., grad_fn=<MseLossBackward>)
output :  tensor([[234168.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1446e+09, grad_fn=<MseLossBackward>)
output :  tensor([[212246.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9618e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165234.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3249e+08, grad_fn=<MseLossBackward>)
output :  tensor([[120061.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(8635930., grad_fn=<MseLossBackward>)
output :  tensor([[177709.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(503634.1562, grad_fn=<MseLossBackward>)
output :  tensor([[177869.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7454e+09, grad_fn=<MseLossBackward>)
output :  tensor([[202408.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6944e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134156.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(76081.1562, grad_fn=<MseLossBackward>)
output :  tensor([[151798.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1197e+08, grad_fn=<MseLossBackward>)
output :  tensor([[276186.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(661934.8125, grad_fn=<MseLossBackward>)
output :  tensor([[88493.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(12206726., grad_fn=<MseLossBackward>)
output :  tensor([[237990.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2222335.5000, grad_fn=<MseLossBackward>)
output :  tensor([[256966.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0625e+11, grad_fn=<MseLossBackward>)
output :  tensor([[172568.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6599038.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191351.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9052e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152600.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5759625., grad_fn=<MseLossBackward>)
output :  tensor([[205396.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1736e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129660.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(436198.3438, grad_fn=<MseLossBackward>)
output :  tensor([[150766.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(33255586., grad_fn=<MseLossBackward>)
output :  tensor([[173168.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4059e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186044.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(37884.9727, grad_fn=<MseLossBackward>)
output :  tensor([[128905.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(8443610., grad_fn=<MseLossBackward>)
output :  tensor([[139078.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6646889.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177512.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(20361106., grad_fn=<MseLossBackward>)
output :  tensor([[199412.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5591e+09, grad_fn=<MseLossBackward>)
output :  tensor([[242442.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(311172.2188, grad_fn=<MseLossBackward>)
output :  tensor([[155946.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(896661.0625, grad_fn=<MseLossBackward>)
output :  tensor([[199411.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(11638972., grad_fn=<MseLossBackward>)
output :  tensor([[161897.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2033e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176460.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(9238655., grad_fn=<MseLossBackward>)
output :  tensor([[176759.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(9861464., grad_fn=<MseLossBackward>)
output :  tensor([[93788.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(10314636., grad_fn=<MseLossBackward>)
output :  tensor([[174804.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1066e+10, grad_fn=<MseLossBackward>)
output :  tensor([[137529.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6400504.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122181.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(51573380., grad_fn=<MseLossBackward>)
output :  tensor([[170760.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(10496081., grad_fn=<MseLossBackward>)
output :  tensor([[83865.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1288154.1250, grad_fn=<MseLossBackward>)
output :  tensor([[287300.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(7285107., grad_fn=<MseLossBackward>)
output :  tensor([[167612.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6825483., grad_fn=<MseLossBackward>)
output :  tensor([[191822.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9979e+10, grad_fn=<MseLossBackward>)
output :  tensor([[239493.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9266e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149946.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1110685.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121730.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5149779., grad_fn=<MseLossBackward>)
output :  tensor([[112194.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(59370276., grad_fn=<MseLossBackward>)
output :  tensor([[143595.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1771e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173798.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(40444.9805, grad_fn=<MseLossBackward>)
output :  tensor([[113468.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5904e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204896.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2792e+10, grad_fn=<MseLossBackward>)
output :  tensor([[242082.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(339488.3125, grad_fn=<MseLossBackward>)
output :  tensor([[250505.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0934e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221661.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0063e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194175.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4720e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191105.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(13000532., grad_fn=<MseLossBackward>)
output :  tensor([[206499.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7685e+10, grad_fn=<MseLossBackward>)
output :  tensor([[185759.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2572e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178075.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(442162.6562, grad_fn=<MseLossBackward>)
output :  tensor([[151716.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(80336.8125, grad_fn=<MseLossBackward>)
output :  tensor([[333069.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(15446128., grad_fn=<MseLossBackward>)
output :  tensor([[209959.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4163512.7500, grad_fn=<MseLossBackward>)
output :  tensor([[159917.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6834.6387, grad_fn=<MseLossBackward>)
output :  tensor([[183250.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3930e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106565.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2452209.2500, grad_fn=<MseLossBackward>)
output :  tensor([[267888.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2433e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171660.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5016760., grad_fn=<MseLossBackward>)
output :  tensor([[219378.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(34558416., grad_fn=<MseLossBackward>)
output :  tensor([[201045.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9819e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177081.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4485990., grad_fn=<MseLossBackward>)
output :  tensor([[199666.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4553556., grad_fn=<MseLossBackward>)
output :  tensor([[151822.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(10095215., grad_fn=<MseLossBackward>)
output :  tensor([[153056.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8150e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119835.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1784311.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138845.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1333267.1250, grad_fn=<MseLossBackward>)
output :  tensor([[145471.]], grad_fn=<AddmmBackward>)
loss:  tensor(12453841., grad_fn=<MseLossBackward>)
output :  tensor([[202638.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5715e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160367.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(752366.5000, grad_fn=<MseLossBackward>)
output :  tensor([[102704.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(10266617., grad_fn=<MseLossBackward>)
output :  tensor([[224719.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3351e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186962.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6064e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176218.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(70955.6406, grad_fn=<MseLossBackward>)
output :  tensor([[83623.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2634636.2500, grad_fn=<MseLossBackward>)
output :  tensor([[131633.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(9819018., grad_fn=<MseLossBackward>)
output :  tensor([[214159.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(25460.1914, grad_fn=<MseLossBackward>)
output :  tensor([[142920.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1164308.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130996.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(993510.5625, grad_fn=<MseLossBackward>)
output :  tensor([[140831.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3127758., grad_fn=<MseLossBackward>)
output :  tensor([[180726.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8685e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144983.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(966626.9375, grad_fn=<MseLossBackward>)
output :  tensor([[160942.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(887481.7500, grad_fn=<MseLossBackward>)
output :  tensor([[215152.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(23284.8516, grad_fn=<MseLossBackward>)
output :  tensor([[139162.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1671e+09, grad_fn=<MseLossBackward>)
output :  tensor([[258266.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(10669716., grad_fn=<MseLossBackward>)
output :  tensor([[157396.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4423003.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129417.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(841777.5625, grad_fn=<MseLossBackward>)
output :  tensor([[96607.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(2585488.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155666.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0647e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180630.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(533219.4375, grad_fn=<MseLossBackward>)
output :  tensor([[124180.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(13543550., grad_fn=<MseLossBackward>)
output :  tensor([[185465.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8909e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146136.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4404e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149791.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(11826.5625, grad_fn=<MseLossBackward>)
output :  tensor([[187507.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(58798.6719, grad_fn=<MseLossBackward>)
output :  tensor([[251424.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7349e+09, grad_fn=<MseLossBackward>)
output :  tensor([[91350.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(22401.6699, grad_fn=<MseLossBackward>)
output :  tensor([[236576.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(11721850., grad_fn=<MseLossBackward>)
output :  tensor([[125187.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(10974261., grad_fn=<MseLossBackward>)
output :  tensor([[166885.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8039e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115708.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4674e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177974.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3899020.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164583.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3422e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155798.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4000e+08, grad_fn=<MseLossBackward>)
output :  tensor([[241161.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4673906., grad_fn=<MseLossBackward>)
output :  tensor([[229094.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3552e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128312.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1723517.6250, grad_fn=<MseLossBackward>)
output :  tensor([[127447.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2095120.5000, grad_fn=<MseLossBackward>)
output :  tensor([[222435.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(20832948., grad_fn=<MseLossBackward>)
output :  tensor([[229593.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(19417242., grad_fn=<MseLossBackward>)
output :  tensor([[228266.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2455342., grad_fn=<MseLossBackward>)
output :  tensor([[149117.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1248073., grad_fn=<MseLossBackward>)
output :  tensor([[210175.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(30635.9375, grad_fn=<MseLossBackward>)
output :  tensor([[132646.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5994e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136216.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(13810979., grad_fn=<MseLossBackward>)
output :  tensor([[309606.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(29094898., grad_fn=<MseLossBackward>)
output :  tensor([[140559.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(193696.2656, grad_fn=<MseLossBackward>)
output :  tensor([[122066.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0324e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108858.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(410991.1875, grad_fn=<MseLossBackward>)
output :  tensor([[155363.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9365e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179258.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1138e+09, grad_fn=<MseLossBackward>)
output :  tensor([[170476.]], grad_fn=<AddmmBackward>)
loss:  tensor(6370576., grad_fn=<MseLossBackward>)
output :  tensor([[189440.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3363e+08, grad_fn=<MseLossBackward>)
output :  tensor([[104484.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(20107938., grad_fn=<MseLossBackward>)
output :  tensor([[180167.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1362582., grad_fn=<MseLossBackward>)
output :  tensor([[166677.]], grad_fn=<AddmmBackward>)
loss:  tensor(1495729., grad_fn=<MseLossBackward>)
output :  tensor([[140807.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3267282.2500, grad_fn=<MseLossBackward>)
output :  tensor([[257053.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0414e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143914.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4709e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174532.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2348508.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143841.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(14757362., grad_fn=<MseLossBackward>)
output :  tensor([[196608.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(15140124., grad_fn=<MseLossBackward>)
output :  tensor([[168604.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1948118., grad_fn=<MseLossBackward>)
output :  tensor([[239830.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(17383818., grad_fn=<MseLossBackward>)
output :  tensor([[135003.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(253402.1250, grad_fn=<MseLossBackward>)
output :  tensor([[153000.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(13326036., grad_fn=<MseLossBackward>)
output :  tensor([[212588.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5817518., grad_fn=<MseLossBackward>)
output :  tensor([[162736.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5123503., grad_fn=<MseLossBackward>)
output :  tensor([[188206.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(629270.3750, grad_fn=<MseLossBackward>)
output :  tensor([[133874.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3127e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129371.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(138041.2812, grad_fn=<MseLossBackward>)
output :  tensor([[141274.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1625107.1250, grad_fn=<MseLossBackward>)
output :  tensor([[199039.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9647e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167394.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7451e+09, grad_fn=<MseLossBackward>)
output :  tensor([[77882.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1978e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94341.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(96855584., grad_fn=<MseLossBackward>)
output :  tensor([[251324.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3873270., grad_fn=<MseLossBackward>)
output :  tensor([[203461.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1553e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114544.]], grad_fn=<AddmmBackward>)
loss:  tensor(207936., grad_fn=<MseLossBackward>)
output :  tensor([[159136.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0449e+08, grad_fn=<MseLossBackward>)
output :  tensor([[205452.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1163e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179366.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2144e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157397.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5745908.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168321.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2816995., grad_fn=<MseLossBackward>)
output :  tensor([[115620.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(384748.8438, grad_fn=<MseLossBackward>)
output :  tensor([[167450.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5502e+08, grad_fn=<MseLossBackward>)
output :  tensor([[192129.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1817e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220456.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(914025.6250, grad_fn=<MseLossBackward>)
output :  tensor([[243330.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5167e+11, grad_fn=<MseLossBackward>)
output :  tensor([[145711.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1659507.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109373.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(798942.6875, grad_fn=<MseLossBackward>)
output :  tensor([[169698.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4888e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148601.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3604955., grad_fn=<MseLossBackward>)
output :  tensor([[231283.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(32677480., grad_fn=<MseLossBackward>)
output :  tensor([[114443.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(310127.1562, grad_fn=<MseLossBackward>)
output :  tensor([[184659.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3096225.2500, grad_fn=<MseLossBackward>)
output :  tensor([[185607.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1192668.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164857.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4069e+10, grad_fn=<MseLossBackward>)
output :  tensor([[95209.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0192e+08, grad_fn=<MseLossBackward>)
output :  tensor([[233293.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(32560932., grad_fn=<MseLossBackward>)
output :  tensor([[178458.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(6041841., grad_fn=<MseLossBackward>)
output :  tensor([[141102.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1215402.8750, grad_fn=<MseLossBackward>)
output :  tensor([[237364.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5589604., grad_fn=<MseLossBackward>)
output :  tensor([[161478.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2314201.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200126.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5593e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133733.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1603072.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186007.]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7634e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135738.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(68243.3984, grad_fn=<MseLossBackward>)
output :  tensor([[222236.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8943e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223968.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7765e+08, grad_fn=<MseLossBackward>)
output :  tensor([[90593.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(352752.4688, grad_fn=<MseLossBackward>)
output :  tensor([[161207.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3144803.5000, grad_fn=<MseLossBackward>)
output :  tensor([[242137.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6574e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146890.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3574108.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110727.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9121e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164919.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(176281.8906, grad_fn=<MseLossBackward>)
output :  tensor([[144514.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(264581.6250, grad_fn=<MseLossBackward>)
output :  tensor([[129237.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(1076454.8750, grad_fn=<MseLossBackward>)
output :  tensor([[190863.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6426e+09, grad_fn=<MseLossBackward>)
output :  tensor([[122106.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(155032.9062, grad_fn=<MseLossBackward>)
output :  tensor([[153188.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1411715.2500, grad_fn=<MseLossBackward>)
output :  tensor([[168109.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(13250283., grad_fn=<MseLossBackward>)
output :  tensor([[150729.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(73415.5938, grad_fn=<MseLossBackward>)
output :  tensor([[162295.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(365193.5938, grad_fn=<MseLossBackward>)
output :  tensor([[137265.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9892e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133217.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1481317.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158864.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9462e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145832.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2823870.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156985.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(22701800., grad_fn=<MseLossBackward>)
output :  tensor([[141448.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9532e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147560.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1536980., grad_fn=<MseLossBackward>)
output :  tensor([[183447.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(20724260., grad_fn=<MseLossBackward>)
output :  tensor([[171975.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(8850718., grad_fn=<MseLossBackward>)
output :  tensor([[179846.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(23437.6953, grad_fn=<MseLossBackward>)
output :  tensor([[219547.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(204332.2500, grad_fn=<MseLossBackward>)
output :  tensor([[112531.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(21448694., grad_fn=<MseLossBackward>)
output :  tensor([[136613.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3721e+08, grad_fn=<MseLossBackward>)
output :  tensor([[285843.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(24502.0312, grad_fn=<MseLossBackward>)
output :  tensor([[117965.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(3864695.2500, grad_fn=<MseLossBackward>)
output :  tensor([[172377.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2679e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185351.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(123420.4688, grad_fn=<MseLossBackward>)
output :  tensor([[178439.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(49851544., grad_fn=<MseLossBackward>)
output :  tensor([[251424.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5581e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224410.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5809079., grad_fn=<MseLossBackward>)
output :  tensor([[133888.]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8333e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177287.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8987e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124431.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(186165.2812, grad_fn=<MseLossBackward>)
output :  tensor([[180546.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6685e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153151.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(22923.8516, grad_fn=<MseLossBackward>)
output :  tensor([[157105.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1248e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203230.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(9421159., grad_fn=<MseLossBackward>)
output :  tensor([[143223.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1500e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175427.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(328024.6562, grad_fn=<MseLossBackward>)
output :  tensor([[248484.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6193e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148308.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(95075.8672, grad_fn=<MseLossBackward>)
output :  tensor([[203379.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(510577.2500, grad_fn=<MseLossBackward>)
output :  tensor([[159933.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(261.5295, grad_fn=<MseLossBackward>)
output :  tensor([[126556.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4866e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138059.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5335450.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178746.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(27602546., grad_fn=<MseLossBackward>)
output :  tensor([[196996.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(48948388., grad_fn=<MseLossBackward>)
output :  tensor([[211577.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9942e+09, grad_fn=<MseLossBackward>)
output :  tensor([[253951.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(9295925., grad_fn=<MseLossBackward>)
output :  tensor([[179026.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9592e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147930.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1844e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146896.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5744635.5000, grad_fn=<MseLossBackward>)
output :  tensor([[74848.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2144e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144700.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(94101520., grad_fn=<MseLossBackward>)
output :  tensor([[127747.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1328220.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156279.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5195194., grad_fn=<MseLossBackward>)
output :  tensor([[125540.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(2131440.2500, grad_fn=<MseLossBackward>)
output :  tensor([[78668.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(4700258., grad_fn=<MseLossBackward>)
output :  tensor([[83054.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(1112184.5000, grad_fn=<MseLossBackward>)
output :  tensor([[234145.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4601494., grad_fn=<MseLossBackward>)
output :  tensor([[141992.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6979e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125399.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(26018368., grad_fn=<MseLossBackward>)
output :  tensor([[168773.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3145191.5000, grad_fn=<MseLossBackward>)
output :  tensor([[234598.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(160888.7344, grad_fn=<MseLossBackward>)
output :  tensor([[188222.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(15346439., grad_fn=<MseLossBackward>)
output :  tensor([[155530.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(220327.5625, grad_fn=<MseLossBackward>)
output :  tensor([[197608.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(84781.0625, grad_fn=<MseLossBackward>)
output :  tensor([[195974.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6831e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137276.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(76236.3906, grad_fn=<MseLossBackward>)
output :  tensor([[155985.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(970748.3750, grad_fn=<MseLossBackward>)
output :  tensor([[138475.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6129879.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194737.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2435e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156458.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6046373.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142540.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4049e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145658.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(575274.8750, grad_fn=<MseLossBackward>)
output :  tensor([[206571.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(29465050., grad_fn=<MseLossBackward>)
output :  tensor([[107519.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5124e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171168.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(13456631., grad_fn=<MseLossBackward>)
output :  tensor([[128059.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(3552.3462, grad_fn=<MseLossBackward>)
output :  tensor([[148369.]], grad_fn=<AddmmBackward>)
loss:  tensor(1874161., grad_fn=<MseLossBackward>)
output :  tensor([[107313.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0187e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141000.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(12255032., grad_fn=<MseLossBackward>)
output :  tensor([[230542.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(29781408., grad_fn=<MseLossBackward>)
output :  tensor([[142756.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5033713., grad_fn=<MseLossBackward>)
output :  tensor([[140505.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9030870., grad_fn=<MseLossBackward>)
output :  tensor([[165354.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3954e+09, grad_fn=<MseLossBackward>)
output :  tensor([[263220.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1844e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179001.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(16008251., grad_fn=<MseLossBackward>)
output :  tensor([[105708.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(8599098., grad_fn=<MseLossBackward>)
output :  tensor([[197793.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3532e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160624.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2637579., grad_fn=<MseLossBackward>)
output :  tensor([[160318.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7136e+10, grad_fn=<MseLossBackward>)
output :  tensor([[98366.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4453.4766, grad_fn=<MseLossBackward>)
output :  tensor([[121397.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(4850077., grad_fn=<MseLossBackward>)
output :  tensor([[154939.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1124991.6250, grad_fn=<MseLossBackward>)
output :  tensor([[140888.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(789932.1250, grad_fn=<MseLossBackward>)
output :  tensor([[198668.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1771935.3750, grad_fn=<MseLossBackward>)
output :  tensor([[143519.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2307740.7500, grad_fn=<MseLossBackward>)
output :  tensor([[264345.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4267065., grad_fn=<MseLossBackward>)
output :  tensor([[127600.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1972e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164625.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(764613.6250, grad_fn=<MseLossBackward>)
output :  tensor([[190778.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5193698.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123815.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9087e+08, grad_fn=<MseLossBackward>)
output :  tensor([[247059.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8648102., grad_fn=<MseLossBackward>)
output :  tensor([[157438.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7386e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243557.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3213280.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142411.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2522190.7500, grad_fn=<MseLossBackward>)
output :  tensor([[207641.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5563849., grad_fn=<MseLossBackward>)
output :  tensor([[176809.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(19442726., grad_fn=<MseLossBackward>)
output :  tensor([[151280.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7393810.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121867.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(14960094., grad_fn=<MseLossBackward>)
output :  tensor([[238640.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3474e+09, grad_fn=<MseLossBackward>)
output :  tensor([[234697.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(28119986., grad_fn=<MseLossBackward>)
output :  tensor([[151824.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2287041.7500, grad_fn=<MseLossBackward>)
output :  tensor([[256509.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2591345.2500, grad_fn=<MseLossBackward>)
output :  tensor([[122497.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(63894420., grad_fn=<MseLossBackward>)
output :  tensor([[175010.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(979295.8125, grad_fn=<MseLossBackward>)
output :  tensor([[158015.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3936318., grad_fn=<MseLossBackward>)
output :  tensor([[130306.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(481169.8438, grad_fn=<MseLossBackward>)
output :  tensor([[198746.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7951e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164767.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(589440.0625, grad_fn=<MseLossBackward>)
output :  tensor([[160220.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7725794., grad_fn=<MseLossBackward>)
output :  tensor([[156487.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2287609., grad_fn=<MseLossBackward>)
output :  tensor([[152374.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6122454.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174630.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2420e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158775.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1499247.2500, grad_fn=<MseLossBackward>)
output :  tensor([[371810.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4786e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124251.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7555455., grad_fn=<MseLossBackward>)
output :  tensor([[130114.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9905e+09, grad_fn=<MseLossBackward>)
output :  tensor([[284237.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(9149680., grad_fn=<MseLossBackward>)
output :  tensor([[159846.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4636956.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132014.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3257e+08, grad_fn=<MseLossBackward>)
output :  tensor([[241517.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(90583696., grad_fn=<MseLossBackward>)
output :  tensor([[178418.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4331992., grad_fn=<MseLossBackward>)
output :  tensor([[155175.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(10080823., grad_fn=<MseLossBackward>)
output :  tensor([[147496.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(6234775., grad_fn=<MseLossBackward>)
output :  tensor([[155817.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5786e+08, grad_fn=<MseLossBackward>)
output :  tensor([[100050.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2537.6406, grad_fn=<MseLossBackward>)
output :  tensor([[82013.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8459e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164260.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(547415., grad_fn=<MseLossBackward>)
output :  tensor([[187664.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6270e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158386.]], grad_fn=<AddmmBackward>)
loss:  tensor(148996., grad_fn=<MseLossBackward>)
output :  tensor([[159680.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4756284., grad_fn=<MseLossBackward>)
output :  tensor([[136622.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(684187.4375, grad_fn=<MseLossBackward>)
output :  tensor([[205651.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(89158.2266, grad_fn=<MseLossBackward>)
output :  tensor([[140760.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(7618549., grad_fn=<MseLossBackward>)
output :  tensor([[181220.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6584e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145691.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(94873.6250, grad_fn=<MseLossBackward>)
output :  tensor([[111292.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0046e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92787.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1470762.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174428.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(326576.5312, grad_fn=<MseLossBackward>)
output :  tensor([[259077.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1748882.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140329.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1371131.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158631.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1596748.1250, grad_fn=<MseLossBackward>)
output :  tensor([[133534.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1069737.7500, grad_fn=<MseLossBackward>)
output :  tensor([[149520.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(426.0354, grad_fn=<MseLossBackward>)
output :  tensor([[171355.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(11942424., grad_fn=<MseLossBackward>)
output :  tensor([[127089.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(7933.5205, grad_fn=<MseLossBackward>)
output :  tensor([[175472.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2857e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158208.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1461114.3750, grad_fn=<MseLossBackward>)
output :  tensor([[116626.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(16041.8057, grad_fn=<MseLossBackward>)
output :  tensor([[161535.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1071e+09, grad_fn=<MseLossBackward>)
output :  tensor([[51740.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(67303.7656, grad_fn=<MseLossBackward>)
output :  tensor([[233769.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1985e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200807.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(36936.0352, grad_fn=<MseLossBackward>)
output :  tensor([[183714.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1653354., grad_fn=<MseLossBackward>)
output :  tensor([[107338.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(1792356.1250, grad_fn=<MseLossBackward>)
output :  tensor([[89597.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(6745180., grad_fn=<MseLossBackward>)
output :  tensor([[143358.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(11277948., grad_fn=<MseLossBackward>)
output :  tensor([[217301.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8827e+09, grad_fn=<MseLossBackward>)
output :  tensor([[198116.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(88041272., grad_fn=<MseLossBackward>)
output :  tensor([[168339.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(11154765., grad_fn=<MseLossBackward>)
output :  tensor([[172197.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6123e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191817.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3303703.7500, grad_fn=<MseLossBackward>)
output :  tensor([[89682.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(7196141.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138760.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1537483.7500, grad_fn=<MseLossBackward>)
output :  tensor([[109122.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1897506.2500, grad_fn=<MseLossBackward>)
output :  tensor([[150589.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1402e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172368.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7113e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193223.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3868e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180943.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(890133.3125, grad_fn=<MseLossBackward>)
output :  tensor([[98590.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4370321., grad_fn=<MseLossBackward>)
output :  tensor([[118297.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(635358.4375, grad_fn=<MseLossBackward>)
output :  tensor([[160567.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4910e+08, grad_fn=<MseLossBackward>)
output :  tensor([[201547.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2395433.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144320.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(102530.0391, grad_fn=<MseLossBackward>)
train_loss: [2.6731151e+09]
epoch_result tensor([0.])
output :  tensor([[157815.]], grad_fn=<AddmmBackward>)
loss:  tensor(469225., grad_fn=<MseLossBackward>)
output :  tensor([[124229.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4970322., grad_fn=<MseLossBackward>)
output :  tensor([[194238.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1420.3477, grad_fn=<MseLossBackward>)
output :  tensor([[178797.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3231006.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155255.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1731e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132211.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(17740550., grad_fn=<MseLossBackward>)
output :  tensor([[142528.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2337315.5000, grad_fn=<MseLossBackward>)
output :  tensor([[118852.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(21783.9141, grad_fn=<MseLossBackward>)
output :  tensor([[72569.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9794e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164302.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2880445.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136847.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(9938355., grad_fn=<MseLossBackward>)
output :  tensor([[224472.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(278256.2500, grad_fn=<MseLossBackward>)
output :  tensor([[166537.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6062059.5000, grad_fn=<MseLossBackward>)
output :  tensor([[247731.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3874746.2500, grad_fn=<MseLossBackward>)
output :  tensor([[55556.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(310031.4688, grad_fn=<MseLossBackward>)
output :  tensor([[165536.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4252e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183001.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(64017000., grad_fn=<MseLossBackward>)
output :  tensor([[155925.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(329601.5625, grad_fn=<MseLossBackward>)
output :  tensor([[273348.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2726213.7500, grad_fn=<MseLossBackward>)
output :  tensor([[196379.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(385291.7812, grad_fn=<MseLossBackward>)
output :  tensor([[136215.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6333e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193666.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(45255.9141, grad_fn=<MseLossBackward>)
output :  tensor([[176671.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3260e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151322.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(104268.4453, grad_fn=<MseLossBackward>)
output :  tensor([[171870.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3500114.7500, grad_fn=<MseLossBackward>)
output :  tensor([[83598.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(3247119.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169244.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1634e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186161.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1350135.1250, grad_fn=<MseLossBackward>)
output :  tensor([[203662.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6872e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111850.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(3422529., grad_fn=<MseLossBackward>)
output :  tensor([[170759.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(57810.1914, grad_fn=<MseLossBackward>)
output :  tensor([[139414.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8496678., grad_fn=<MseLossBackward>)
output :  tensor([[126625.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(5638881., grad_fn=<MseLossBackward>)
output :  tensor([[122333.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(8029120.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145644.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2053e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171510.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0589e+10, grad_fn=<MseLossBackward>)
output :  tensor([[148238.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2137124.2500, grad_fn=<MseLossBackward>)
output :  tensor([[181890.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3573222.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143429.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5901787., grad_fn=<MseLossBackward>)
output :  tensor([[109378.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7554e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136947.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0922e+09, grad_fn=<MseLossBackward>)
output :  tensor([[132105.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8378763.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132753.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(33097368., grad_fn=<MseLossBackward>)
output :  tensor([[225651.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(424045.1562, grad_fn=<MseLossBackward>)
output :  tensor([[133430.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1394502.6250, grad_fn=<MseLossBackward>)
output :  tensor([[149104.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(10838.7617, grad_fn=<MseLossBackward>)
output :  tensor([[112318.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(101397.4688, grad_fn=<MseLossBackward>)
output :  tensor([[161743.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3038593.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147944.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2142e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192353.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(125271.7500, grad_fn=<MseLossBackward>)
output :  tensor([[134757.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(94306.5703, grad_fn=<MseLossBackward>)
output :  tensor([[105047.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(24525012., grad_fn=<MseLossBackward>)
output :  tensor([[233605.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(155371.4688, grad_fn=<MseLossBackward>)
output :  tensor([[164883.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3626e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155332.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(13448723., grad_fn=<MseLossBackward>)
output :  tensor([[205206.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7987e+10, grad_fn=<MseLossBackward>)
output :  tensor([[239523.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3105e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145562.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4253261.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137511.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(12328877., grad_fn=<MseLossBackward>)
output :  tensor([[156667.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2781077.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134932.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(24326936., grad_fn=<MseLossBackward>)
output :  tensor([[184037.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7703e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184975.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(766254.0625, grad_fn=<MseLossBackward>)
output :  tensor([[165446.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(15574739., grad_fn=<MseLossBackward>)
output :  tensor([[134194.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(77529400., grad_fn=<MseLossBackward>)
output :  tensor([[143300.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(640300.0625, grad_fn=<MseLossBackward>)
output :  tensor([[148010.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(9063110., grad_fn=<MseLossBackward>)
output :  tensor([[171239.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6850e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192758.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8764e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139591.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9554667., grad_fn=<MseLossBackward>)
output :  tensor([[169829.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4288652.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179797.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1446006.2500, grad_fn=<MseLossBackward>)
output :  tensor([[117384.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(5687517., grad_fn=<MseLossBackward>)
output :  tensor([[219032.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3872101.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183514.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(223.5959, grad_fn=<MseLossBackward>)
output :  tensor([[126684.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(1403947.2500, grad_fn=<MseLossBackward>)
output :  tensor([[194583.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3673092., grad_fn=<MseLossBackward>)
output :  tensor([[177468.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(6597834.5000, grad_fn=<MseLossBackward>)
output :  tensor([[208346.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1650e+10, grad_fn=<MseLossBackward>)
output :  tensor([[206929.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(16567571., grad_fn=<MseLossBackward>)
output :  tensor([[172231.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7000e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193691.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(653950.1875, grad_fn=<MseLossBackward>)
output :  tensor([[112296.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(495484., grad_fn=<MseLossBackward>)
output :  tensor([[114786.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(5229547., grad_fn=<MseLossBackward>)
output :  tensor([[109407.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(6718504.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147663.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(745551.3125, grad_fn=<MseLossBackward>)
output :  tensor([[159339.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3600e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179389.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(372729.3438, grad_fn=<MseLossBackward>)
output :  tensor([[129673.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(4723253.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145905.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(819223., grad_fn=<MseLossBackward>)
output :  tensor([[184431.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4533e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118727.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(3340698.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194473.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(6385650., grad_fn=<MseLossBackward>)
output :  tensor([[143267.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3000527.7500, grad_fn=<MseLossBackward>)
output :  tensor([[215229.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5428172., grad_fn=<MseLossBackward>)
output :  tensor([[128162.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4676271., grad_fn=<MseLossBackward>)
output :  tensor([[248215.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(12712.5625, grad_fn=<MseLossBackward>)
output :  tensor([[235958.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4051e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152044.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2620e+08, grad_fn=<MseLossBackward>)
output :  tensor([[87487.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0157e+08, grad_fn=<MseLossBackward>)
output :  tensor([[190646.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0986e+09, grad_fn=<MseLossBackward>)
output :  tensor([[85046.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(16373087., grad_fn=<MseLossBackward>)
output :  tensor([[138066.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2054743.1250, grad_fn=<MseLossBackward>)
output :  tensor([[78503.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(9019464., grad_fn=<MseLossBackward>)
output :  tensor([[141805.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1316469.3750, grad_fn=<MseLossBackward>)
output :  tensor([[176206.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(42461.7539, grad_fn=<MseLossBackward>)
output :  tensor([[152448.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1105159.3750, grad_fn=<MseLossBackward>)
output :  tensor([[110192.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7799801.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200919.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3186e+10, grad_fn=<MseLossBackward>)
output :  tensor([[127627.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(761869.8750, grad_fn=<MseLossBackward>)
output :  tensor([[265662.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0556e+08, grad_fn=<MseLossBackward>)
output :  tensor([[300796.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(84699232., grad_fn=<MseLossBackward>)
output :  tensor([[111900.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(19365776., grad_fn=<MseLossBackward>)
output :  tensor([[169902.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6748467.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133648.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5783e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146085.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(50201652., grad_fn=<MseLossBackward>)
output :  tensor([[127800.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6001045.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124336.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(440512.2188, grad_fn=<MseLossBackward>)
output :  tensor([[135193.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6014e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226938.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8440e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187192.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3657e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143523.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(141764.0156, grad_fn=<MseLossBackward>)
output :  tensor([[129479.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(3919317.2500, grad_fn=<MseLossBackward>)
output :  tensor([[111255.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(30.3360, grad_fn=<MseLossBackward>)
output :  tensor([[252153.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3439e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134686.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(98252.8594, grad_fn=<MseLossBackward>)
output :  tensor([[196284.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(45095004., grad_fn=<MseLossBackward>)
output :  tensor([[102088.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(7905498.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141293.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1805538.1250, grad_fn=<MseLossBackward>)
output :  tensor([[205884.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4654e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177130.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7668226.5000, grad_fn=<MseLossBackward>)
output :  tensor([[188023.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(9141552., grad_fn=<MseLossBackward>)
output :  tensor([[163348.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1214e+10, grad_fn=<MseLossBackward>)
output :  tensor([[294372.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6506e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195795.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4428262.5000, grad_fn=<MseLossBackward>)
output :  tensor([[262819.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9612e+10, grad_fn=<MseLossBackward>)
output :  tensor([[216641.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4363e+09, grad_fn=<MseLossBackward>)
output :  tensor([[274662.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7925e+09, grad_fn=<MseLossBackward>)
output :  tensor([[224435.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(189565., grad_fn=<MseLossBackward>)
output :  tensor([[222918.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8589e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196168.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(691938., grad_fn=<MseLossBackward>)
output :  tensor([[159803.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4887e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132182.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(100607.9062, grad_fn=<MseLossBackward>)
output :  tensor([[136133.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(401757.9062, grad_fn=<MseLossBackward>)
output :  tensor([[90600.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(159282.0625, grad_fn=<MseLossBackward>)
output :  tensor([[109340.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1796772.7500, grad_fn=<MseLossBackward>)
output :  tensor([[273252.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0967e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236326.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1759022., grad_fn=<MseLossBackward>)
output :  tensor([[145303.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(92378., grad_fn=<MseLossBackward>)
output :  tensor([[139053.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2413750.7500, grad_fn=<MseLossBackward>)
output :  tensor([[175913.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4753354., grad_fn=<MseLossBackward>)
output :  tensor([[141840.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(11624371., grad_fn=<MseLossBackward>)
output :  tensor([[164793.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8247e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164891.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(11829.9609, grad_fn=<MseLossBackward>)
output :  tensor([[138968.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3874438.7500, grad_fn=<MseLossBackward>)
output :  tensor([[190834.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6696e+09, grad_fn=<MseLossBackward>)
output :  tensor([[112846.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(715729.2500, grad_fn=<MseLossBackward>)
output :  tensor([[172936.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(876417.7500, grad_fn=<MseLossBackward>)
output :  tensor([[120357.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(127962.7031, grad_fn=<MseLossBackward>)
output :  tensor([[87474.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(224794.5156, grad_fn=<MseLossBackward>)
output :  tensor([[179074.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(856347.8125, grad_fn=<MseLossBackward>)
output :  tensor([[113168.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(10682326., grad_fn=<MseLossBackward>)
output :  tensor([[239994.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(989434.3125, grad_fn=<MseLossBackward>)
output :  tensor([[246662.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2764010.2500, grad_fn=<MseLossBackward>)
output :  tensor([[131167.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2781911.2500, grad_fn=<MseLossBackward>)
output :  tensor([[112816.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(14877413., grad_fn=<MseLossBackward>)
output :  tensor([[288831.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2000e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174472.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8832970., grad_fn=<MseLossBackward>)
output :  tensor([[128395.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(11531489., grad_fn=<MseLossBackward>)
output :  tensor([[146982.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3998e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198119.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5219e+08, grad_fn=<MseLossBackward>)
output :  tensor([[142101.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1212545.1250, grad_fn=<MseLossBackward>)
output :  tensor([[157469.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5014e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157566.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(13446660., grad_fn=<MseLossBackward>)
output :  tensor([[133294.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(14396096., grad_fn=<MseLossBackward>)
output :  tensor([[240653.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9002e+10, grad_fn=<MseLossBackward>)
output :  tensor([[401379.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(384942.6875, grad_fn=<MseLossBackward>)
output :  tensor([[111270.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5156021.5000, grad_fn=<MseLossBackward>)
output :  tensor([[115915.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(6682144., grad_fn=<MseLossBackward>)
output :  tensor([[159179.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(102890.5859, grad_fn=<MseLossBackward>)
output :  tensor([[132061.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8131e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162432.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5482e+09, grad_fn=<MseLossBackward>)
output :  tensor([[169757.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5710e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103423.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(31069.5703, grad_fn=<MseLossBackward>)
output :  tensor([[138572.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5892377., grad_fn=<MseLossBackward>)
output :  tensor([[367322.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(808.6914, grad_fn=<MseLossBackward>)
output :  tensor([[199857.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9314e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172135.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(11322384., grad_fn=<MseLossBackward>)
output :  tensor([[199990.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8467373., grad_fn=<MseLossBackward>)
output :  tensor([[138866.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(17818.0781, grad_fn=<MseLossBackward>)
output :  tensor([[193471.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1057201.6250, grad_fn=<MseLossBackward>)
output :  tensor([[136617.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4784e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177789.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(10305404., grad_fn=<MseLossBackward>)
output :  tensor([[239167.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(8020489.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170555.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(11863719., grad_fn=<MseLossBackward>)
output :  tensor([[110681.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(7192495.5000, grad_fn=<MseLossBackward>)
output :  tensor([[265570.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1019090.2500, grad_fn=<MseLossBackward>)
output :  tensor([[248697.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1696099.2500, grad_fn=<MseLossBackward>)
output :  tensor([[121458.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(2376824.5000, grad_fn=<MseLossBackward>)
output :  tensor([[213583.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7720e+09, grad_fn=<MseLossBackward>)
output :  tensor([[303413.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7903e+08, grad_fn=<MseLossBackward>)
output :  tensor([[205786.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1471672.2500, grad_fn=<MseLossBackward>)
output :  tensor([[214221.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5820e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158675.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(601424.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172686.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7270101., grad_fn=<MseLossBackward>)
output :  tensor([[161002.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(16570497., grad_fn=<MseLossBackward>)
output :  tensor([[174151.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(17238066., grad_fn=<MseLossBackward>)
output :  tensor([[230257.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4245e+09, grad_fn=<MseLossBackward>)
output :  tensor([[210950.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4246e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163324.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6650e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125267.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5139926.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175568.]], grad_fn=<AddmmBackward>)
loss:  tensor(2050624., grad_fn=<MseLossBackward>)
output :  tensor([[179092.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5460e+09, grad_fn=<MseLossBackward>)
output :  tensor([[202836.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6780e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136739.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5324917., grad_fn=<MseLossBackward>)
output :  tensor([[153286.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0041e+09, grad_fn=<MseLossBackward>)
output :  tensor([[278146.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1315250.6250, grad_fn=<MseLossBackward>)
output :  tensor([[83826.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(1377230.6250, grad_fn=<MseLossBackward>)
output :  tensor([[234960.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2371070.7500, grad_fn=<MseLossBackward>)
output :  tensor([[256417.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0661e+11, grad_fn=<MseLossBackward>)
output :  tensor([[169928.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5063.2119, grad_fn=<MseLossBackward>)
output :  tensor([[191748.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8707e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154938.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3753.4768, grad_fn=<MseLossBackward>)
output :  tensor([[205267.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1903e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129578.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(334183.3438, grad_fn=<MseLossBackward>)
output :  tensor([[149013.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(16108809., grad_fn=<MseLossBackward>)
output :  tensor([[171110.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1856e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184064.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3189517., grad_fn=<MseLossBackward>)
output :  tensor([[129690.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(13616907., grad_fn=<MseLossBackward>)
output :  tensor([[139137.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6956241.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172866.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(17822.2500, grad_fn=<MseLossBackward>)
output :  tensor([[200211.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4789e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239672.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(11074336., grad_fn=<MseLossBackward>)
output :  tensor([[153307.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2863763., grad_fn=<MseLossBackward>)
output :  tensor([[196579.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(335494.3750, grad_fn=<MseLossBackward>)
output :  tensor([[165058.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4344e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196373.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8472e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183725.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(14631223., grad_fn=<MseLossBackward>)
output :  tensor([[97960.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(923085.6250, grad_fn=<MseLossBackward>)
output :  tensor([[174628.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1103e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136208.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1460132.3750, grad_fn=<MseLossBackward>)
output :  tensor([[123172.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(66782732., grad_fn=<MseLossBackward>)
output :  tensor([[174010.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(107.3167, grad_fn=<MseLossBackward>)
output :  tensor([[87391.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(5721028.5000, grad_fn=<MseLossBackward>)
output :  tensor([[293798.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(14429077., grad_fn=<MseLossBackward>)
output :  tensor([[164243.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(572765.1875, grad_fn=<MseLossBackward>)
output :  tensor([[187985.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1078e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243217.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7185e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150240.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(576958.9375, grad_fn=<MseLossBackward>)
output :  tensor([[122484.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(2296101., grad_fn=<MseLossBackward>)
output :  tensor([[118212.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(2848843., grad_fn=<MseLossBackward>)
output :  tensor([[141840.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2041e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174454.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(206499.2344, grad_fn=<MseLossBackward>)
output :  tensor([[111130.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1969e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204769.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2821e+10, grad_fn=<MseLossBackward>)
output :  tensor([[234859.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(44091884., grad_fn=<MseLossBackward>)
output :  tensor([[249337.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1273e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222224.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8142e+08, grad_fn=<MseLossBackward>)
output :  tensor([[193402.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4908e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189157.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2747565.2500, grad_fn=<MseLossBackward>)
output :  tensor([[205300.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8211e+10, grad_fn=<MseLossBackward>)
output :  tensor([[184655.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2905e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177693.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1095489.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156140.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(17143740., grad_fn=<MseLossBackward>)
output :  tensor([[337960.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(922380.1875, grad_fn=<MseLossBackward>)
output :  tensor([[210192.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3267903.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160818.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(670402.7500, grad_fn=<MseLossBackward>)
output :  tensor([[185218.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1676e+09, grad_fn=<MseLossBackward>)
output :  tensor([[104697.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(91468.4375, grad_fn=<MseLossBackward>)
output :  tensor([[269920.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1270e+10, grad_fn=<MseLossBackward>)
output :  tensor([[169396.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(20278416., grad_fn=<MseLossBackward>)
output :  tensor([[213641.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(19995.7266, grad_fn=<MseLossBackward>)
output :  tensor([[205637.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3599e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175970.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(10428863., grad_fn=<MseLossBackward>)
output :  tensor([[204993.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(10200738., grad_fn=<MseLossBackward>)
output :  tensor([[158270.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(10694739., grad_fn=<MseLossBackward>)
output :  tensor([[152716.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7790e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119032.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(283148.6875, grad_fn=<MseLossBackward>)
output :  tensor([[139575.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(180160.4531, grad_fn=<MseLossBackward>)
output :  tensor([[146876.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4508190.5000, grad_fn=<MseLossBackward>)
output :  tensor([[201881.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5906e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159694.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(37860.6484, grad_fn=<MseLossBackward>)
output :  tensor([[100777.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(1631507.2500, grad_fn=<MseLossBackward>)
output :  tensor([[222592.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0302e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185774.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1107e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176078.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(165331.1875, grad_fn=<MseLossBackward>)
output :  tensor([[85599.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(12954713., grad_fn=<MseLossBackward>)
output :  tensor([[127188.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1720401.1250, grad_fn=<MseLossBackward>)
output :  tensor([[217231.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(10439664., grad_fn=<MseLossBackward>)
output :  tensor([[142400.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2559100., grad_fn=<MseLossBackward>)
output :  tensor([[129949.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2507.8186, grad_fn=<MseLossBackward>)
output :  tensor([[146352.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(14081256., grad_fn=<MseLossBackward>)
output :  tensor([[181283.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9170e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146495.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6225960.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160663.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(440418.8750, grad_fn=<MseLossBackward>)
output :  tensor([[215048.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2329.5706, grad_fn=<MseLossBackward>)
output :  tensor([[140213.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2400e+09, grad_fn=<MseLossBackward>)
output :  tensor([[256320.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1743513.8750, grad_fn=<MseLossBackward>)
output :  tensor([[161146.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2710756.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125632.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(8221794.5000, grad_fn=<MseLossBackward>)
output :  tensor([[95716.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(514066.5938, grad_fn=<MseLossBackward>)
output :  tensor([[153132.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7104e+09, grad_fn=<MseLossBackward>)
output :  tensor([[177820.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4326075., grad_fn=<MseLossBackward>)
output :  tensor([[121512.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(1024887.3125, grad_fn=<MseLossBackward>)
output :  tensor([[185640.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8757e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146674.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5124e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151391.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2224106.2500, grad_fn=<MseLossBackward>)
output :  tensor([[189519.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3131351.5000, grad_fn=<MseLossBackward>)
output :  tensor([[252260.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6660e+09, grad_fn=<MseLossBackward>)
output :  tensor([[91488.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(138.7979, grad_fn=<MseLossBackward>)
output :  tensor([[235127.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(23742626., grad_fn=<MseLossBackward>)
output :  tensor([[130026.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(2329606., grad_fn=<MseLossBackward>)
output :  tensor([[166284.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9232e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114806.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1924e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177097.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1203751.8750, grad_fn=<MseLossBackward>)
output :  tensor([[162957.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5498e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156764.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8980e+08, grad_fn=<MseLossBackward>)
output :  tensor([[233850.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(26513650., grad_fn=<MseLossBackward>)
output :  tensor([[228933.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4486e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124803.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4825504.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123459.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(6454894.5000, grad_fn=<MseLossBackward>)
output :  tensor([[224380.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6862107.5000, grad_fn=<MseLossBackward>)
output :  tensor([[231042.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(8749487., grad_fn=<MseLossBackward>)
output :  tensor([[221180.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(30461258., grad_fn=<MseLossBackward>)
output :  tensor([[145253.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7545751.5000, grad_fn=<MseLossBackward>)
output :  tensor([[207667.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5440629., grad_fn=<MseLossBackward>)
output :  tensor([[129942.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(98861848., grad_fn=<MseLossBackward>)
output :  tensor([[135470.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8822199., grad_fn=<MseLossBackward>)
output :  tensor([[304537.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0946e+08, grad_fn=<MseLossBackward>)
output :  tensor([[143146.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4607328., grad_fn=<MseLossBackward>)
output :  tensor([[121191.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9368e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109480.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(384.5276, grad_fn=<MseLossBackward>)
output :  tensor([[154779.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1401e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178395.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2793e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171498.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2254736.7500, grad_fn=<MseLossBackward>)
output :  tensor([[189198.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3929e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96519.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(12115892., grad_fn=<MseLossBackward>)
output :  tensor([[175026.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(15786095., grad_fn=<MseLossBackward>)
output :  tensor([[168922.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1045793.8750, grad_fn=<MseLossBackward>)
output :  tensor([[137462.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2364194.5000, grad_fn=<MseLossBackward>)
output :  tensor([[252064.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1457e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143185.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3855e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174294.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1675042.6250, grad_fn=<MseLossBackward>)
output :  tensor([[138712.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1658461., grad_fn=<MseLossBackward>)
output :  tensor([[204551.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(16418324., grad_fn=<MseLossBackward>)
output :  tensor([[168196.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3251147., grad_fn=<MseLossBackward>)
output :  tensor([[242393.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2581595.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134620.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(14475.0977, grad_fn=<MseLossBackward>)
output :  tensor([[151150.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3241181.2500, grad_fn=<MseLossBackward>)
output :  tensor([[216362.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1856576.6250, grad_fn=<MseLossBackward>)
output :  tensor([[164618.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(145327.7344, grad_fn=<MseLossBackward>)
output :  tensor([[198946.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(98935040., grad_fn=<MseLossBackward>)
output :  tensor([[134782.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8651e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131385.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5688597.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138354.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2708698.7500, grad_fn=<MseLossBackward>)
output :  tensor([[198140.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0921e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165575.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5578e+09, grad_fn=<MseLossBackward>)
output :  tensor([[79334.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7384e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94434.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(98686688., grad_fn=<MseLossBackward>)
output :  tensor([[252980.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(97841.8828, grad_fn=<MseLossBackward>)
output :  tensor([[203161.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1167e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116681.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(2826890.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155372.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0322e+09, grad_fn=<MseLossBackward>)
output :  tensor([[202539.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0486e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179776.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1402e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157807.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(7880214., grad_fn=<MseLossBackward>)
output :  tensor([[167478.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6357883.5000, grad_fn=<MseLossBackward>)
output :  tensor([[114168.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(691236.3750, grad_fn=<MseLossBackward>)
output :  tensor([[165514.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1055e+08, grad_fn=<MseLossBackward>)
output :  tensor([[191796.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2811e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219751.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(63267.9688, grad_fn=<MseLossBackward>)
output :  tensor([[242515.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5249e+11, grad_fn=<MseLossBackward>)
output :  tensor([[147751.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(565457., grad_fn=<MseLossBackward>)
output :  tensor([[109548.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(1141575.3750, grad_fn=<MseLossBackward>)
output :  tensor([[168245.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8646e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155697.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(27011732., grad_fn=<MseLossBackward>)
output :  tensor([[235614.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1919913.3750, grad_fn=<MseLossBackward>)
output :  tensor([[116359.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1849472.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182995.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(9096.3906, grad_fn=<MseLossBackward>)
output :  tensor([[189063.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5585024.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163122.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4611e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97574.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7471e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235732.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(10675841., grad_fn=<MseLossBackward>)
output :  tensor([[179736.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(13964118., grad_fn=<MseLossBackward>)
output :  tensor([[140373.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(139537.2656, grad_fn=<MseLossBackward>)
output :  tensor([[235672.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(452487.4375, grad_fn=<MseLossBackward>)
output :  tensor([[164381.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1908671.7500, grad_fn=<MseLossBackward>)
output :  tensor([[199574.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5732e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133317.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2831805.2500, grad_fn=<MseLossBackward>)
output :  tensor([[185984.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7528e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136158.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(24993.6328, grad_fn=<MseLossBackward>)
output :  tensor([[223557.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5481e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222130.]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7674e+08, grad_fn=<MseLossBackward>)
output :  tensor([[90754.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(568598.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158448.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(971179.4375, grad_fn=<MseLossBackward>)
output :  tensor([[243646.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6188e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146801.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3244501.5000, grad_fn=<MseLossBackward>)
output :  tensor([[112994.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1155e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163651.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(719713.6250, grad_fn=<MseLossBackward>)
output :  tensor([[143693.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(94172.2656, grad_fn=<MseLossBackward>)
output :  tensor([[130093.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(3584957.7500, grad_fn=<MseLossBackward>)
output :  tensor([[189659.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8081e+09, grad_fn=<MseLossBackward>)
output :  tensor([[121817.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(466371.6250, grad_fn=<MseLossBackward>)
output :  tensor([[152773.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(597915.5625, grad_fn=<MseLossBackward>)
output :  tensor([[169220.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6396236., grad_fn=<MseLossBackward>)
output :  tensor([[152241.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1540585.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158076.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(23266756., grad_fn=<MseLossBackward>)
output :  tensor([[135713.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1361e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131040.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(920625.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156486.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0579e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146110.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3836150.7500, grad_fn=<MseLossBackward>)
output :  tensor([[160070.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2822347.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140803.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5501e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150373.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2475164.7500, grad_fn=<MseLossBackward>)
output :  tensor([[184434.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(12714127., grad_fn=<MseLossBackward>)
output :  tensor([[169295.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(87606.7500, grad_fn=<MseLossBackward>)
output :  tensor([[178672.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1761965.8750, grad_fn=<MseLossBackward>)
output :  tensor([[220118.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(14112.6973, grad_fn=<MseLossBackward>)
output :  tensor([[113682.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(33442638., grad_fn=<MseLossBackward>)
output :  tensor([[139813.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2242e+08, grad_fn=<MseLossBackward>)
output :  tensor([[282329.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(13469129., grad_fn=<MseLossBackward>)
output :  tensor([[117468.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2156538.2500, grad_fn=<MseLossBackward>)
output :  tensor([[175562.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9747e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181221.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(14280605., grad_fn=<MseLossBackward>)
output :  tensor([[190843.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(28557502., grad_fn=<MseLossBackward>)
output :  tensor([[249508.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4983e+08, grad_fn=<MseLossBackward>)
output :  tensor([[218897.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(9625021., grad_fn=<MseLossBackward>)
output :  tensor([[135718.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8916e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175557.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0886e+08, grad_fn=<MseLossBackward>)
output :  tensor([[121618.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(5672844.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182642.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5607e+10, grad_fn=<MseLossBackward>)
output :  tensor([[148359.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(21533660., grad_fn=<MseLossBackward>)
output :  tensor([[155519.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(81352792., grad_fn=<MseLossBackward>)
output :  tensor([[204789.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2281279.7500, grad_fn=<MseLossBackward>)
output :  tensor([[144051.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3344e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174434.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2450203.2500, grad_fn=<MseLossBackward>)
output :  tensor([[248961.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3261e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147919.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6502.9102, grad_fn=<MseLossBackward>)
output :  tensor([[199547.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(9718709., grad_fn=<MseLossBackward>)
output :  tensor([[167519.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(57293544., grad_fn=<MseLossBackward>)
output :  tensor([[125966.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4415e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134655.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1197246.2500, grad_fn=<MseLossBackward>)
output :  tensor([[179391.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(21235536., grad_fn=<MseLossBackward>)
output :  tensor([[194593.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(21104118., grad_fn=<MseLossBackward>)
output :  tensor([[218549.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9632e+09, grad_fn=<MseLossBackward>)
output :  tensor([[254880.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4493936.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180244.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9253e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146266.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9993e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144720.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(48771.9609, grad_fn=<MseLossBackward>)
output :  tensor([[73420.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1169e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130193.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(23101316., grad_fn=<MseLossBackward>)
output :  tensor([[133203.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(18523474., grad_fn=<MseLossBackward>)
output :  tensor([[154985.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(970717.5625, grad_fn=<MseLossBackward>)
output :  tensor([[134041.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(49587344., grad_fn=<MseLossBackward>)
output :  tensor([[77146.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(417871.3438, grad_fn=<MseLossBackward>)
output :  tensor([[83877.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3524009., grad_fn=<MseLossBackward>)
output :  tensor([[220290.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3712e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140866.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0465e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129703.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(634188.2500, grad_fn=<MseLossBackward>)
output :  tensor([[171179.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(17467176., grad_fn=<MseLossBackward>)
output :  tensor([[234339.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(436095.1250, grad_fn=<MseLossBackward>)
output :  tensor([[189966.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4724306., grad_fn=<MseLossBackward>)
output :  tensor([[157735.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3013099.2500, grad_fn=<MseLossBackward>)
output :  tensor([[198835.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(874867.9375, grad_fn=<MseLossBackward>)
output :  tensor([[197042.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5966e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134562.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5941939.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153140.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3457449.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138245.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5042831.5000, grad_fn=<MseLossBackward>)
output :  tensor([[196548.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1190e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156012.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4050345., grad_fn=<MseLossBackward>)
output :  tensor([[137201.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9098e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141261.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(13235385., grad_fn=<MseLossBackward>)
output :  tensor([[203408.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(73812528., grad_fn=<MseLossBackward>)
output :  tensor([[107398.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4509e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168395.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(801472.5625, grad_fn=<MseLossBackward>)
output :  tensor([[126900.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1209140.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147903.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(816199.3125, grad_fn=<MseLossBackward>)
output :  tensor([[105077.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8228e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137916.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(173394.1719, grad_fn=<MseLossBackward>)
output :  tensor([[234797.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1446983.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146911.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3654011.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140571.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9432577., grad_fn=<MseLossBackward>)
output :  tensor([[166157.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4560e+09, grad_fn=<MseLossBackward>)
output :  tensor([[261905.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5904e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174926.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5399.9531, grad_fn=<MseLossBackward>)
output :  tensor([[102259.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(266618.9375, grad_fn=<MseLossBackward>)
output :  tensor([[199604.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0676e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157774.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1502999.3750, grad_fn=<MseLossBackward>)
output :  tensor([[162584.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6157e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97623.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(457166.1562, grad_fn=<MseLossBackward>)
output :  tensor([[124619.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(1038918.3125, grad_fn=<MseLossBackward>)
output :  tensor([[158840.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(8068262.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140211.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(44811.5977, grad_fn=<MseLossBackward>)
output :  tensor([[200658.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(433478.2188, grad_fn=<MseLossBackward>)
output :  tensor([[143298.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1687076.2500, grad_fn=<MseLossBackward>)
output :  tensor([[262415.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(18453.5234, grad_fn=<MseLossBackward>)
output :  tensor([[130848.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4325e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167370.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3497250.7500, grad_fn=<MseLossBackward>)
output :  tensor([[189317.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(668791.7500, grad_fn=<MseLossBackward>)
output :  tensor([[123135.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7254e+08, grad_fn=<MseLossBackward>)
output :  tensor([[254772.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(22778844., grad_fn=<MseLossBackward>)
output :  tensor([[157294.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8242e+08, grad_fn=<MseLossBackward>)
output :  tensor([[242672.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7170261.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146007.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4029993.5000, grad_fn=<MseLossBackward>)
output :  tensor([[210665.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(443431.1250, grad_fn=<MseLossBackward>)
output :  tensor([[176189.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(14360902., grad_fn=<MseLossBackward>)
output :  tensor([[153302.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(486375.4688, grad_fn=<MseLossBackward>)
output :  tensor([[119767.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(3122316.5000, grad_fn=<MseLossBackward>)
output :  tensor([[236182.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5915e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237032.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8803460., grad_fn=<MseLossBackward>)
output :  tensor([[155445.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4446101.5000, grad_fn=<MseLossBackward>)
output :  tensor([[250721.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(17456336., grad_fn=<MseLossBackward>)
output :  tensor([[120468.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(35579920., grad_fn=<MseLossBackward>)
output :  tensor([[175692.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(94268.1875, grad_fn=<MseLossBackward>)
output :  tensor([[159270.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(532033.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134708.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(13751697., grad_fn=<MseLossBackward>)
output :  tensor([[198144.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7120e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166162.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4674717., grad_fn=<MseLossBackward>)
output :  tensor([[166561.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(12685840., grad_fn=<MseLossBackward>)
output :  tensor([[157775.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(50554.7109, grad_fn=<MseLossBackward>)
output :  tensor([[145174.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(22333156., grad_fn=<MseLossBackward>)
output :  tensor([[174458.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2196e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161457.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2124534., grad_fn=<MseLossBackward>)
output :  tensor([[376490.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(55944324., grad_fn=<MseLossBackward>)
output :  tensor([[134296.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(53235036., grad_fn=<MseLossBackward>)
output :  tensor([[129148.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9052e+09, grad_fn=<MseLossBackward>)
output :  tensor([[280085.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1271467.6250, grad_fn=<MseLossBackward>)
output :  tensor([[161847.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(23380.3203, grad_fn=<MseLossBackward>)
output :  tensor([[130012.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(90489144., grad_fn=<MseLossBackward>)
output :  tensor([[231240.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(576555.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178645.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3439170.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153548.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2397416.7500, grad_fn=<MseLossBackward>)
output :  tensor([[143422.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2488161.2500, grad_fn=<MseLossBackward>)
output :  tensor([[157221.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1297e+08, grad_fn=<MseLossBackward>)
output :  tensor([[99383.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(379677.4062, grad_fn=<MseLossBackward>)
output :  tensor([[84634.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0687e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165097.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(9475.8057, grad_fn=<MseLossBackward>)
output :  tensor([[188592.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5529e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155823.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4737288.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152703.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(23006712., grad_fn=<MseLossBackward>)
output :  tensor([[138815.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1865785.2500, grad_fn=<MseLossBackward>)
output :  tensor([[209568.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(13090489., grad_fn=<MseLossBackward>)
output :  tensor([[138446.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(199111.1719, grad_fn=<MseLossBackward>)
output :  tensor([[181668.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6469e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147292.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1670152.3750, grad_fn=<MseLossBackward>)
output :  tensor([[112055.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4425e+08, grad_fn=<MseLossBackward>)
output :  tensor([[97928.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(15430964., grad_fn=<MseLossBackward>)
output :  tensor([[172974.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4100878.2500, grad_fn=<MseLossBackward>)
output :  tensor([[262003.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2570210.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140207.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1671687.3750, grad_fn=<MseLossBackward>)
output :  tensor([[158761.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1285247.3750, grad_fn=<MseLossBackward>)
output :  tensor([[132795.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(87200.2422, grad_fn=<MseLossBackward>)
output :  tensor([[146338.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(9996564., grad_fn=<MseLossBackward>)
output :  tensor([[169859.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3841477.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126621.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(143629.1562, grad_fn=<MseLossBackward>)
output :  tensor([[175490.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2969e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156041.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(918302.9375, grad_fn=<MseLossBackward>)
output :  tensor([[113127.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(11375126., grad_fn=<MseLossBackward>)
output :  tensor([[159446.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4101e+09, grad_fn=<MseLossBackward>)
output :  tensor([[55853.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(14845729., grad_fn=<MseLossBackward>)
output :  tensor([[234515.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0815e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201546.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(298781.8125, grad_fn=<MseLossBackward>)
output :  tensor([[181985.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(9088152., grad_fn=<MseLossBackward>)
output :  tensor([[106746.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(557868.9375, grad_fn=<MseLossBackward>)
output :  tensor([[90684.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(13576749., grad_fn=<MseLossBackward>)
output :  tensor([[135651.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(18907550., grad_fn=<MseLossBackward>)
output :  tensor([[216959.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9352e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199324.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(66838032., grad_fn=<MseLossBackward>)
output :  tensor([[169595.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(21118476., grad_fn=<MseLossBackward>)
output :  tensor([[171216.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7953e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189275.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(524470.1875, grad_fn=<MseLossBackward>)
output :  tensor([[88721.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(2964073.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139892.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(11495.8604, grad_fn=<MseLossBackward>)
output :  tensor([[112099.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(2559875., grad_fn=<MseLossBackward>)
output :  tensor([[151294.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3515e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172817.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7487e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194261.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1532e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177948.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4209998.5000, grad_fn=<MseLossBackward>)
output :  tensor([[97957.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2123441., grad_fn=<MseLossBackward>)
output :  tensor([[119017.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2302332., grad_fn=<MseLossBackward>)
output :  tensor([[161022.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2797e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195631.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(19087342., grad_fn=<MseLossBackward>)
output :  tensor([[143921.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6172.0664, grad_fn=<MseLossBackward>)
train_loss: [2.670721e+09]
epoch_result tensor([0.])
output :  tensor([[158956.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(208749.0469, grad_fn=<MseLossBackward>)
output :  tensor([[120809.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(1417160., grad_fn=<MseLossBackward>)
output :  tensor([[195968.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3125326.7500, grad_fn=<MseLossBackward>)
output :  tensor([[176720.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(77910.7656, grad_fn=<MseLossBackward>)
output :  tensor([[155237.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1815e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126328.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2794486.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142931.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3730752.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122134.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9826266., grad_fn=<MseLossBackward>)
output :  tensor([[69628.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2384e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166457.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(209306.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142239.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5016900., grad_fn=<MseLossBackward>)
output :  tensor([[224282.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(514380.3125, grad_fn=<MseLossBackward>)
output :  tensor([[169940.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(883658.7500, grad_fn=<MseLossBackward>)
output :  tensor([[248559.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1300205.7500, grad_fn=<MseLossBackward>)
output :  tensor([[53812.3945]], grad_fn=<AddmmBackward>)
loss:  tensor(1410406.7500, grad_fn=<MseLossBackward>)
output :  tensor([[163376.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5632e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177811.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7906114., grad_fn=<MseLossBackward>)
output :  tensor([[171680.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3046e+08, grad_fn=<MseLossBackward>)
output :  tensor([[277020.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4080778.7500, grad_fn=<MseLossBackward>)
output :  tensor([[196288.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(505743.2188, grad_fn=<MseLossBackward>)
output :  tensor([[136566.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6139e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196122.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(5034764.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179556.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0561e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150368.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(398713.3125, grad_fn=<MseLossBackward>)
output :  tensor([[169774.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(50772.7656, grad_fn=<MseLossBackward>)
output :  tensor([[89002.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(12974798., grad_fn=<MseLossBackward>)
output :  tensor([[168102.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0363e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183678.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1745123.6250, grad_fn=<MseLossBackward>)
output :  tensor([[200854.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9861e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110543.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(294967.7812, grad_fn=<MseLossBackward>)
output :  tensor([[168452.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6487766., grad_fn=<MseLossBackward>)
output :  tensor([[133910.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6705024.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129463.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(214390.7031, grad_fn=<MseLossBackward>)
output :  tensor([[120733.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1521291., grad_fn=<MseLossBackward>)
output :  tensor([[147268.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1617e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171133.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0698e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153716.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(16130641., grad_fn=<MseLossBackward>)
output :  tensor([[183037.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9227545., grad_fn=<MseLossBackward>)
output :  tensor([[140479.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(271017.8438, grad_fn=<MseLossBackward>)
output :  tensor([[106982.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8840e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136429.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1733e+09, grad_fn=<MseLossBackward>)
output :  tensor([[131330.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(13467524., grad_fn=<MseLossBackward>)
output :  tensor([[139947.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6764e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222702.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(5278003.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131080.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1367949.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146244.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(7590541.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110738.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1592052.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159581.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(174828.5156, grad_fn=<MseLossBackward>)
output :  tensor([[147571.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2494e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189587.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5818498., grad_fn=<MseLossBackward>)
output :  tensor([[133575.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(764695.6250, grad_fn=<MseLossBackward>)
output :  tensor([[120522.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1073e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237157.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9971188., grad_fn=<MseLossBackward>)
output :  tensor([[163479.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5011e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165353.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(40362992., grad_fn=<MseLossBackward>)
output :  tensor([[204695.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8158e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243710.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2164e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143861.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(130569.3047, grad_fn=<MseLossBackward>)
output :  tensor([[138548.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(20690132., grad_fn=<MseLossBackward>)
output :  tensor([[158933.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(15469718., grad_fn=<MseLossBackward>)
output :  tensor([[132066.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4272295., grad_fn=<MseLossBackward>)
output :  tensor([[184642.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6788e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179355.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(22511912., grad_fn=<MseLossBackward>)
output :  tensor([[164211.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7350114., grad_fn=<MseLossBackward>)
output :  tensor([[143834.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(696494.5625, grad_fn=<MseLossBackward>)
output :  tensor([[140211.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5235158.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140178.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(23250026., grad_fn=<MseLossBackward>)
output :  tensor([[171979.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5842e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194350.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1301e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136229.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(72933.7500, grad_fn=<MseLossBackward>)
output :  tensor([[176779.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(23807842., grad_fn=<MseLossBackward>)
output :  tensor([[177716.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(10779012., grad_fn=<MseLossBackward>)
output :  tensor([[114553.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(199452.9531, grad_fn=<MseLossBackward>)
output :  tensor([[225492.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(20184522., grad_fn=<MseLossBackward>)
output :  tensor([[180727.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7688489., grad_fn=<MseLossBackward>)
output :  tensor([[125732.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(54168.9258, grad_fn=<MseLossBackward>)
output :  tensor([[196443.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3232.9885, grad_fn=<MseLossBackward>)
output :  tensor([[174538.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(130388.6953, grad_fn=<MseLossBackward>)
output :  tensor([[208342.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1651e+10, grad_fn=<MseLossBackward>)
output :  tensor([[210634.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(133853.0781, grad_fn=<MseLossBackward>)
output :  tensor([[170775.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5821e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195871.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1882212.5000, grad_fn=<MseLossBackward>)
output :  tensor([[112580.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(176091.7031, grad_fn=<MseLossBackward>)
output :  tensor([[114739.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5015780., grad_fn=<MseLossBackward>)
output :  tensor([[111409.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(348376.6250, grad_fn=<MseLossBackward>)
output :  tensor([[146438.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(130817.8438, grad_fn=<MseLossBackward>)
output :  tensor([[161854.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2684e+10, grad_fn=<MseLossBackward>)
output :  tensor([[183088.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(9539508., grad_fn=<MseLossBackward>)
output :  tensor([[129084.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(2512051.7500, grad_fn=<MseLossBackward>)
output :  tensor([[143504.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2236380., grad_fn=<MseLossBackward>)
output :  tensor([[188048.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8247e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119754.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(8148125.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198967.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3870195.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145471.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(222769.2500, grad_fn=<MseLossBackward>)
output :  tensor([[211724.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1382204.3750, grad_fn=<MseLossBackward>)
output :  tensor([[127590.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2528149.7500, grad_fn=<MseLossBackward>)
output :  tensor([[248993.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(442495.1875, grad_fn=<MseLossBackward>)
output :  tensor([[236350.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3668e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153111.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7138e+08, grad_fn=<MseLossBackward>)
output :  tensor([[88367.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4899e+08, grad_fn=<MseLossBackward>)
output :  tensor([[189631.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2708e+09, grad_fn=<MseLossBackward>)
output :  tensor([[82801.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(3243685.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139319.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(32676.2109, grad_fn=<MseLossBackward>)
output :  tensor([[77644.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4600489., grad_fn=<MseLossBackward>)
output :  tensor([[141847.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1222061.1250, grad_fn=<MseLossBackward>)
output :  tensor([[174489.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2282648.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153546.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2169.5217, grad_fn=<MseLossBackward>)
output :  tensor([[109889.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6196521., grad_fn=<MseLossBackward>)
output :  tensor([[202397.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2849e+10, grad_fn=<MseLossBackward>)
output :  tensor([[130731.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(4981789., grad_fn=<MseLossBackward>)
output :  tensor([[268988.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2125e+08, grad_fn=<MseLossBackward>)
output :  tensor([[299848.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0306e+08, grad_fn=<MseLossBackward>)
output :  tensor([[108952.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(2108825.7500, grad_fn=<MseLossBackward>)
output :  tensor([[171207.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1670839., grad_fn=<MseLossBackward>)
output :  tensor([[135716.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6821e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140415.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2002357.6250, grad_fn=<MseLossBackward>)
output :  tensor([[131357.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1226971.6250, grad_fn=<MseLossBackward>)
output :  tensor([[130883.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(34619156., grad_fn=<MseLossBackward>)
output :  tensor([[138623.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4816e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227940.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8048e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186483.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3875e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144615.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(512141.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125909.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(2529168.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110739.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(260139.8438, grad_fn=<MseLossBackward>)
output :  tensor([[253833.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1252e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137476.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6134368., grad_fn=<MseLossBackward>)
output :  tensor([[199979.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(9120589., grad_fn=<MseLossBackward>)
output :  tensor([[107992.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9565972., grad_fn=<MseLossBackward>)
output :  tensor([[140476.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(276840.4062, grad_fn=<MseLossBackward>)
output :  tensor([[205406.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6457e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178797.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1214920.6250, grad_fn=<MseLossBackward>)
output :  tensor([[185889.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(790960.1250, grad_fn=<MseLossBackward>)
output :  tensor([[164907.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0763e+10, grad_fn=<MseLossBackward>)
output :  tensor([[292908.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7717e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196379.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2312965.7500, grad_fn=<MseLossBackward>)
output :  tensor([[259433.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0572e+10, grad_fn=<MseLossBackward>)
output :  tensor([[214273.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6757e+09, grad_fn=<MseLossBackward>)
output :  tensor([[277462.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5632e+09, grad_fn=<MseLossBackward>)
output :  tensor([[222942.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1118471.5000, grad_fn=<MseLossBackward>)
output :  tensor([[224214.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8152e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196989.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(105.3831, grad_fn=<MseLossBackward>)
output :  tensor([[160684.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0039e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135887.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(11478332., grad_fn=<MseLossBackward>)
output :  tensor([[130906.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(21095864., grad_fn=<MseLossBackward>)
output :  tensor([[92712.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(2931559.2500, grad_fn=<MseLossBackward>)
output :  tensor([[104474.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(12428104., grad_fn=<MseLossBackward>)
output :  tensor([[272625.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1669e+09, grad_fn=<MseLossBackward>)
output :  tensor([[235240.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(57742.5898, grad_fn=<MseLossBackward>)
output :  tensor([[147050.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4202628., grad_fn=<MseLossBackward>)
output :  tensor([[138792.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1670233.1250, grad_fn=<MseLossBackward>)
output :  tensor([[173774.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1715.7717, grad_fn=<MseLossBackward>)
output :  tensor([[144131.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1250448.1250, grad_fn=<MseLossBackward>)
output :  tensor([[166137.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0442e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166371.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1881912.3750, grad_fn=<MseLossBackward>)
output :  tensor([[136392.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(369398.0625, grad_fn=<MseLossBackward>)
output :  tensor([[191525.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7645e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114045.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(4185061., grad_fn=<MseLossBackward>)
output :  tensor([[168878.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(9744152., grad_fn=<MseLossBackward>)
output :  tensor([[119175.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(680612.1250, grad_fn=<MseLossBackward>)
output :  tensor([[87855.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(731866.8750, grad_fn=<MseLossBackward>)
output :  tensor([[181188.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1411492.5000, grad_fn=<MseLossBackward>)
output :  tensor([[113489.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(12886081., grad_fn=<MseLossBackward>)
output :  tensor([[233409.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(31249672., grad_fn=<MseLossBackward>)
output :  tensor([[245499.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(249406.6094, grad_fn=<MseLossBackward>)
output :  tensor([[122991.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(42360064., grad_fn=<MseLossBackward>)
output :  tensor([[114528.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(31021418., grad_fn=<MseLossBackward>)
output :  tensor([[289006.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1948e+10, grad_fn=<MseLossBackward>)
output :  tensor([[175737.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(17954288., grad_fn=<MseLossBackward>)
output :  tensor([[124263.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(542961.7500, grad_fn=<MseLossBackward>)
output :  tensor([[146529.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1394e+08, grad_fn=<MseLossBackward>)
output :  tensor([[200768.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7507e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140421.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(335005.8125, grad_fn=<MseLossBackward>)
output :  tensor([[156845.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5167e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152529.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1879169.7500, grad_fn=<MseLossBackward>)
output :  tensor([[131012.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(2287869., grad_fn=<MseLossBackward>)
output :  tensor([[242327.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8543e+10, grad_fn=<MseLossBackward>)
output :  tensor([[403153.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1330057.6250, grad_fn=<MseLossBackward>)
output :  tensor([[112277.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(10742774., grad_fn=<MseLossBackward>)
output :  tensor([[128172.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(93560432., grad_fn=<MseLossBackward>)
output :  tensor([[161412.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3658433.2500, grad_fn=<MseLossBackward>)
output :  tensor([[133799.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0807e+08, grad_fn=<MseLossBackward>)
output :  tensor([[159668.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8852e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174152.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1156e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108324.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(22317874., grad_fn=<MseLossBackward>)
output :  tensor([[143945.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(8673945., grad_fn=<MseLossBackward>)
output :  tensor([[363159.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(17096932., grad_fn=<MseLossBackward>)
output :  tensor([[203903.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5096e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179749.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(18054134., grad_fn=<MseLossBackward>)
output :  tensor([[208380.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(30031942., grad_fn=<MseLossBackward>)
output :  tensor([[137733.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1602874.7500, grad_fn=<MseLossBackward>)
output :  tensor([[195565.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1136089.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138920.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8723e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177564.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(11799869., grad_fn=<MseLossBackward>)
output :  tensor([[239789.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4885205., grad_fn=<MseLossBackward>)
output :  tensor([[173399.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(361144.6562, grad_fn=<MseLossBackward>)
output :  tensor([[112694.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(22036056., grad_fn=<MseLossBackward>)
output :  tensor([[263781.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(607181.8750, grad_fn=<MseLossBackward>)
output :  tensor([[251520.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2313298.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127021.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(16175416., grad_fn=<MseLossBackward>)
output :  tensor([[212611.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8924e+09, grad_fn=<MseLossBackward>)
output :  tensor([[302564.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1691e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207326.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(106745.1406, grad_fn=<MseLossBackward>)
output :  tensor([[211019.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6636e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157892.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(63.7502, grad_fn=<MseLossBackward>)
output :  tensor([[167308.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(7189939.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161702.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(22756328., grad_fn=<MseLossBackward>)
output :  tensor([[169439.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(313845.0625, grad_fn=<MseLossBackward>)
output :  tensor([[231543.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3291e+09, grad_fn=<MseLossBackward>)
output :  tensor([[213739.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4701e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160488.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8193e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122223.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(602709.6250, grad_fn=<MseLossBackward>)
output :  tensor([[178198.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1435765.6250, grad_fn=<MseLossBackward>)
output :  tensor([[180292.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3533e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201209.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7406e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136283.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3426490.2500, grad_fn=<MseLossBackward>)
output :  tensor([[151528.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9570e+08, grad_fn=<MseLossBackward>)
output :  tensor([[274035.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8789928., grad_fn=<MseLossBackward>)
output :  tensor([[89126.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(17028002., grad_fn=<MseLossBackward>)
output :  tensor([[237956.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2122575.7500, grad_fn=<MseLossBackward>)
output :  tensor([[253648.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0843e+11, grad_fn=<MseLossBackward>)
output :  tensor([[172860.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(8183265., grad_fn=<MseLossBackward>)
output :  tensor([[188764.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1377e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154181.]], grad_fn=<AddmmBackward>)
loss:  tensor(670761., grad_fn=<MseLossBackward>)
output :  tensor([[205796.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1221e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127926.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1153442.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145494.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(244391.1875, grad_fn=<MseLossBackward>)
output :  tensor([[175047.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0593e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185430.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(175927.8125, grad_fn=<MseLossBackward>)
output :  tensor([[128204.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(4860750.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136540.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1632.6650, grad_fn=<MseLossBackward>)
output :  tensor([[178035.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(25354372., grad_fn=<MseLossBackward>)
output :  tensor([[200553.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4449e+09, grad_fn=<MseLossBackward>)
output :  tensor([[242206.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(629096.8125, grad_fn=<MseLossBackward>)
output :  tensor([[153196.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3254077.7500, grad_fn=<MseLossBackward>)
output :  tensor([[194705.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1675528., grad_fn=<MseLossBackward>)
output :  tensor([[161480.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0558e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176986.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(6315954.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179858.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1688.6963, grad_fn=<MseLossBackward>)
output :  tensor([[93296.]], grad_fn=<AddmmBackward>)
loss:  tensor(13719616., grad_fn=<MseLossBackward>)
output :  tensor([[170814.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1922e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132245.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7584774., grad_fn=<MseLossBackward>)
output :  tensor([[120798.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(33618888., grad_fn=<MseLossBackward>)
output :  tensor([[173699.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(90347.2109, grad_fn=<MseLossBackward>)
output :  tensor([[89631.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(21446596., grad_fn=<MseLossBackward>)
output :  tensor([[287197.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(7852605., grad_fn=<MseLossBackward>)
output :  tensor([[166884.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3552282.5000, grad_fn=<MseLossBackward>)
output :  tensor([[192016.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9924e+10, grad_fn=<MseLossBackward>)
output :  tensor([[242151.]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3226e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149599.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1960131.2500, grad_fn=<MseLossBackward>)
output :  tensor([[122413.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(2515520., grad_fn=<MseLossBackward>)
output :  tensor([[120586.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(471357.3438, grad_fn=<MseLossBackward>)
output :  tensor([[147629.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0647e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175623.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2634737.7500, grad_fn=<MseLossBackward>)
output :  tensor([[111411.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3590e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204233.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2943e+10, grad_fn=<MseLossBackward>)
output :  tensor([[236205.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(28035866., grad_fn=<MseLossBackward>)
output :  tensor([[249445.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1242e+10, grad_fn=<MseLossBackward>)
output :  tensor([[220771.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3227e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195227.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4465e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189987.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6188822.5000, grad_fn=<MseLossBackward>)
output :  tensor([[206340.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7755e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186908.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2228e+10, grad_fn=<MseLossBackward>)
output :  tensor([[184728.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(35856704., grad_fn=<MseLossBackward>)
output :  tensor([[153932.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3735220.5000, grad_fn=<MseLossBackward>)
output :  tensor([[337492.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(242710.1875, grad_fn=<MseLossBackward>)
output :  tensor([[212682.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(465870.2500, grad_fn=<MseLossBackward>)
output :  tensor([[157920.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4323995.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186426.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0331e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111113.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(37378320., grad_fn=<MseLossBackward>)
output :  tensor([[267334.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2752e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170576.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(11045237., grad_fn=<MseLossBackward>)
output :  tensor([[212259.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1537716.2500, grad_fn=<MseLossBackward>)
output :  tensor([[202402.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4585e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182038.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8056727.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202362.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(315984.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157164.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4686481., grad_fn=<MseLossBackward>)
output :  tensor([[153168.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8269e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117212.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1658662.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139928.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5107.7822, grad_fn=<MseLossBackward>)
output :  tensor([[145140.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(14896223., grad_fn=<MseLossBackward>)
output :  tensor([[200535.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6247e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160367.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(752908.6875, grad_fn=<MseLossBackward>)
output :  tensor([[100828.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1765535., grad_fn=<MseLossBackward>)
output :  tensor([[226541.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8114e+08, grad_fn=<MseLossBackward>)
output :  tensor([[190111.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0572e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174904.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2497980.2500, grad_fn=<MseLossBackward>)
output :  tensor([[78148.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(14836038., grad_fn=<MseLossBackward>)
output :  tensor([[130903.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(5777300.5000, grad_fn=<MseLossBackward>)
output :  tensor([[213261.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(545843.9375, grad_fn=<MseLossBackward>)
output :  tensor([[143170.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(688588.8125, grad_fn=<MseLossBackward>)
output :  tensor([[129749.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(62953.9453, grad_fn=<MseLossBackward>)
output :  tensor([[144757.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4656896.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179831.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7920e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146544.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6474082.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162114.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4470449.5000, grad_fn=<MseLossBackward>)
output :  tensor([[212259.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7509484., grad_fn=<MseLossBackward>)
output :  tensor([[141294.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3173e+09, grad_fn=<MseLossBackward>)
output :  tensor([[253702.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1684641.7500, grad_fn=<MseLossBackward>)
output :  tensor([[160847.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1815966.7500, grad_fn=<MseLossBackward>)
output :  tensor([[129403.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(816764.0625, grad_fn=<MseLossBackward>)
output :  tensor([[94222.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(604251.1875, grad_fn=<MseLossBackward>)
output :  tensor([[158284.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4442e+09, grad_fn=<MseLossBackward>)
output :  tensor([[177483.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5837433.5000, grad_fn=<MseLossBackward>)
output :  tensor([[118794.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2908783.5000, grad_fn=<MseLossBackward>)
output :  tensor([[188354.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6480e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146832.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5337e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151003.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1217608.7500, grad_fn=<MseLossBackward>)
output :  tensor([[189237.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2211959., grad_fn=<MseLossBackward>)
output :  tensor([[250996.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7708e+09, grad_fn=<MseLossBackward>)
output :  tensor([[91041.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(210279.5625, grad_fn=<MseLossBackward>)
output :  tensor([[238456.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2382922.7500, grad_fn=<MseLossBackward>)
output :  tensor([[127784.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(511627.2812, grad_fn=<MseLossBackward>)
output :  tensor([[166878.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8053e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115415.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3765e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178367.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5604686.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166777.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4953e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157769.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4361e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236904.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4389352.5000, grad_fn=<MseLossBackward>)
output :  tensor([[228598.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6448e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126488.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(261648.2344, grad_fn=<MseLossBackward>)
output :  tensor([[129331.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(11096706., grad_fn=<MseLossBackward>)
output :  tensor([[223030.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(15758667., grad_fn=<MseLossBackward>)
output :  tensor([[230194.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(14480284., grad_fn=<MseLossBackward>)
output :  tensor([[228586.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3557231.7500, grad_fn=<MseLossBackward>)
output :  tensor([[146482.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2302616.5000, grad_fn=<MseLossBackward>)
output :  tensor([[214641.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(21547438., grad_fn=<MseLossBackward>)
output :  tensor([[129381.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(88016504., grad_fn=<MseLossBackward>)
output :  tensor([[136385.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(15096260., grad_fn=<MseLossBackward>)
output :  tensor([[307530.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(55799500., grad_fn=<MseLossBackward>)
output :  tensor([[139110.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3569738., grad_fn=<MseLossBackward>)
output :  tensor([[119749.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7825e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107600.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(3608723.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155017.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0563e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178282.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3011e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174491.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2225644.5000, grad_fn=<MseLossBackward>)
output :  tensor([[189722.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2718e+08, grad_fn=<MseLossBackward>)
output :  tensor([[104617.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(21323976., grad_fn=<MseLossBackward>)
output :  tensor([[180416.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2007269.1250, grad_fn=<MseLossBackward>)
output :  tensor([[168650.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(563836.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142976.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(15813795., grad_fn=<MseLossBackward>)
output :  tensor([[257340.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0355e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141319.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1719e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172863.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(18559.8047, grad_fn=<MseLossBackward>)
output :  tensor([[140836.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(699889.1250, grad_fn=<MseLossBackward>)
output :  tensor([[200095.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(163329.6406, grad_fn=<MseLossBackward>)
output :  tensor([[168166.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3359946.2500, grad_fn=<MseLossBackward>)
output :  tensor([[240786.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(10329394., grad_fn=<MseLossBackward>)
output :  tensor([[134607.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(11479.1133, grad_fn=<MseLossBackward>)
output :  tensor([[151848.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6240394.5000, grad_fn=<MseLossBackward>)
output :  tensor([[213806.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1425412.1250, grad_fn=<MseLossBackward>)
output :  tensor([[165675.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(456595.8438, grad_fn=<MseLossBackward>)
output :  tensor([[190126.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1268439., grad_fn=<MseLossBackward>)
output :  tensor([[134907.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8045e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130940.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(3763872.7500, grad_fn=<MseLossBackward>)
output :  tensor([[144732.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(22396260., grad_fn=<MseLossBackward>)
output :  tensor([[199214.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9400e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165389.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5391e+09, grad_fn=<MseLossBackward>)
output :  tensor([[77031.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9005e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93976.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(89812936., grad_fn=<MseLossBackward>)
output :  tensor([[254010.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(514985.6250, grad_fn=<MseLossBackward>)
output :  tensor([[206168.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5116e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114420.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(336282.1875, grad_fn=<MseLossBackward>)
output :  tensor([[157989.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7089e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203540.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7092e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179876.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1223e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158286.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(10802623., grad_fn=<MseLossBackward>)
output :  tensor([[170271.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(73483.3516, grad_fn=<MseLossBackward>)
output :  tensor([[118370.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(11362377., grad_fn=<MseLossBackward>)
output :  tensor([[165090.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0183e+08, grad_fn=<MseLossBackward>)
output :  tensor([[193818.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7113e+08, grad_fn=<MseLossBackward>)
output :  tensor([[217740.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3095290.5000, grad_fn=<MseLossBackward>)
output :  tensor([[243647.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5135e+11, grad_fn=<MseLossBackward>)
output :  tensor([[148027.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1055306.7500, grad_fn=<MseLossBackward>)
output :  tensor([[109179.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(489967.1875, grad_fn=<MseLossBackward>)
output :  tensor([[173586.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(69110904., grad_fn=<MseLossBackward>)
output :  tensor([[150256.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(59094.5703, grad_fn=<MseLossBackward>)
output :  tensor([[237269.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(72756.6328, grad_fn=<MseLossBackward>)
output :  tensor([[113815.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(1402022.5000, grad_fn=<MseLossBackward>)
output :  tensor([[181019.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3537161.7500, grad_fn=<MseLossBackward>)
output :  tensor([[186676.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(531.8789, grad_fn=<MseLossBackward>)
output :  tensor([[165573.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3847e+10, grad_fn=<MseLossBackward>)
output :  tensor([[95101.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9885e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238819.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(32608.4590, grad_fn=<MseLossBackward>)
output :  tensor([[178409.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(5805088., grad_fn=<MseLossBackward>)
output :  tensor([[142577.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6642539.5000, grad_fn=<MseLossBackward>)
output :  tensor([[234735.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(70067.7422, grad_fn=<MseLossBackward>)
output :  tensor([[163519.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(269993.9062, grad_fn=<MseLossBackward>)
output :  tensor([[202035.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5120e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135986.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(973398.0625, grad_fn=<MseLossBackward>)
output :  tensor([[186721.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1116e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138794.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(7809754., grad_fn=<MseLossBackward>)
output :  tensor([[223943.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4536e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224337.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5855e+08, grad_fn=<MseLossBackward>)
output :  tensor([[88812.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(1409358.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164034.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(21163018., grad_fn=<MseLossBackward>)
output :  tensor([[243914.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6120e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143795.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1450632., grad_fn=<MseLossBackward>)
output :  tensor([[110617.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9025e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164496.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(11.9241, grad_fn=<MseLossBackward>)
output :  tensor([[140669.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(11091294., grad_fn=<MseLossBackward>)
output :  tensor([[129466.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1603507.7500, grad_fn=<MseLossBackward>)
output :  tensor([[192717.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3933e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123790.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(1664200.7500, grad_fn=<MseLossBackward>)
output :  tensor([[151501.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(248595.7344, grad_fn=<MseLossBackward>)
output :  tensor([[166826.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(24243776., grad_fn=<MseLossBackward>)
output :  tensor([[150939.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3719.0940, grad_fn=<MseLossBackward>)
output :  tensor([[160139.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7617859., grad_fn=<MseLossBackward>)
output :  tensor([[135786.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1751e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133894.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3590729., grad_fn=<MseLossBackward>)
output :  tensor([[157111.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2802e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145833.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2827389.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161834.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7195.8105, grad_fn=<MseLossBackward>)
output :  tensor([[140451.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3338e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149911.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1235154.3750, grad_fn=<MseLossBackward>)
output :  tensor([[186383.]], grad_fn=<AddmmBackward>)
loss:  tensor(2614689., grad_fn=<MseLossBackward>)
output :  tensor([[167443.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2422595., grad_fn=<MseLossBackward>)
output :  tensor([[181885.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3553401.7500, grad_fn=<MseLossBackward>)
output :  tensor([[221537.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2365059.5000, grad_fn=<MseLossBackward>)
output :  tensor([[114562.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(44389116., grad_fn=<MseLossBackward>)
output :  tensor([[137847.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6763e+08, grad_fn=<MseLossBackward>)
output :  tensor([[288526.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(6385255., grad_fn=<MseLossBackward>)
output :  tensor([[117869.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3496374., grad_fn=<MseLossBackward>)
output :  tensor([[175706.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9619e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185438.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(192309.6562, grad_fn=<MseLossBackward>)
output :  tensor([[176838.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(75017520., grad_fn=<MseLossBackward>)
output :  tensor([[252094.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2464e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222173.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(30037.2227, grad_fn=<MseLossBackward>)
output :  tensor([[133115.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4067e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177920.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2105e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125592.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(2535484., grad_fn=<MseLossBackward>)
output :  tensor([[181622.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6130e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150356.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6988588., grad_fn=<MseLossBackward>)
output :  tensor([[157703.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2553e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206195.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(10995.4883, grad_fn=<MseLossBackward>)
output :  tensor([[145171.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6056e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176599.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(358894.5938, grad_fn=<MseLossBackward>)
output :  tensor([[245764.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1381e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148116.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(13572.2500, grad_fn=<MseLossBackward>)
output :  tensor([[200702.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3850670.2500, grad_fn=<MseLossBackward>)
output :  tensor([[165898.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(35386884., grad_fn=<MseLossBackward>)
output :  tensor([[125320.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3928e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133030.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7395255.5000, grad_fn=<MseLossBackward>)
output :  tensor([[185756.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3085182.5000, grad_fn=<MseLossBackward>)
output :  tensor([[192772.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(7688142.5000, grad_fn=<MseLossBackward>)
output :  tensor([[216683.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2296e+09, grad_fn=<MseLossBackward>)
output :  tensor([[260017.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(9105966., grad_fn=<MseLossBackward>)
output :  tensor([[179933.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9340e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146401.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0141e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136488.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(64190392., grad_fn=<MseLossBackward>)
output :  tensor([[74956.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2219e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142592.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(57649616., grad_fn=<MseLossBackward>)
output :  tensor([[128076.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(678087.9375, grad_fn=<MseLossBackward>)
output :  tensor([[156449.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6000586., grad_fn=<MseLossBackward>)
output :  tensor([[132173.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(26769630., grad_fn=<MseLossBackward>)
output :  tensor([[77146.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(417952.1562, grad_fn=<MseLossBackward>)
output :  tensor([[81464.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(286542.7500, grad_fn=<MseLossBackward>)
output :  tensor([[231067.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(869323.1250, grad_fn=<MseLossBackward>)
output :  tensor([[142135.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7824e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132349.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3420534.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169788.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7777213.5000, grad_fn=<MseLossBackward>)
output :  tensor([[233866.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1284999.3750, grad_fn=<MseLossBackward>)
output :  tensor([[187697.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(19734140., grad_fn=<MseLossBackward>)
output :  tensor([[155429.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(325595.0625, grad_fn=<MseLossBackward>)
output :  tensor([[201832.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(15464925., grad_fn=<MseLossBackward>)
output :  tensor([[195020.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7622e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134722.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5186579., grad_fn=<MseLossBackward>)
output :  tensor([[155861.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(741590.0625, grad_fn=<MseLossBackward>)
output :  tensor([[135908.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(8329.4141, grad_fn=<MseLossBackward>)
output :  tensor([[193964.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2986e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155546.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2390550.7500, grad_fn=<MseLossBackward>)
output :  tensor([[141456.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2998e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145823.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(852332.8750, grad_fn=<MseLossBackward>)
output :  tensor([[206641.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(28715532., grad_fn=<MseLossBackward>)
output :  tensor([[108771.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1672e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167115.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(147660.0781, grad_fn=<MseLossBackward>)
output :  tensor([[127455.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(296505.7812, grad_fn=<MseLossBackward>)
output :  tensor([[146008.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(983754., grad_fn=<MseLossBackward>)
output :  tensor([[108607.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1367e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137327.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(29627.0156, grad_fn=<MseLossBackward>)
output :  tensor([[239482.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(12129439., grad_fn=<MseLossBackward>)
output :  tensor([[145962.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(926707.0625, grad_fn=<MseLossBackward>)
output :  tensor([[139992.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6212089., grad_fn=<MseLossBackward>)
output :  tensor([[165226.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3858e+09, grad_fn=<MseLossBackward>)
output :  tensor([[262533.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3923e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177373.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(5633502., grad_fn=<MseLossBackward>)
output :  tensor([[104427.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(2725826.7500, grad_fn=<MseLossBackward>)
output :  tensor([[200025.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0023e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160511.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2284490.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159419.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7527e+10, grad_fn=<MseLossBackward>)
output :  tensor([[100382.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4337782.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122780.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(671068.1875, grad_fn=<MseLossBackward>)
output :  tensor([[156450.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(202950.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138481.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2305320.2500, grad_fn=<MseLossBackward>)
output :  tensor([[197991.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4034009.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138746.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(10585872., grad_fn=<MseLossBackward>)
output :  tensor([[257779.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(20251968., grad_fn=<MseLossBackward>)
output :  tensor([[129330.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3199e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164521.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(957676.3125, grad_fn=<MseLossBackward>)
output :  tensor([[189293.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(630063.8750, grad_fn=<MseLossBackward>)
output :  tensor([[125772.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4878e+08, grad_fn=<MseLossBackward>)
output :  tensor([[249232.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(588984.3125, grad_fn=<MseLossBackward>)
output :  tensor([[155357.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0013e+09, grad_fn=<MseLossBackward>)
output :  tensor([[242817.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6415851.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142312.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2849133., grad_fn=<MseLossBackward>)
output :  tensor([[206876.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9757814., grad_fn=<MseLossBackward>)
output :  tensor([[174196.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3228366.7500, grad_fn=<MseLossBackward>)
output :  tensor([[156278.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5192132., grad_fn=<MseLossBackward>)
output :  tensor([[116602.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(1952897.1250, grad_fn=<MseLossBackward>)
output :  tensor([[233177.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9066e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237513.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6181439., grad_fn=<MseLossBackward>)
output :  tensor([[148717.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(21342234., grad_fn=<MseLossBackward>)
output :  tensor([[255279.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(144305.0156, grad_fn=<MseLossBackward>)
output :  tensor([[122795.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(68746512., grad_fn=<MseLossBackward>)
output :  tensor([[179615.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(13070033., grad_fn=<MseLossBackward>)
output :  tensor([[164922.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(24235006., grad_fn=<MseLossBackward>)
output :  tensor([[136934.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(35218660., grad_fn=<MseLossBackward>)
output :  tensor([[197277.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5938e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160768.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(10441179., grad_fn=<MseLossBackward>)
output :  tensor([[163134.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(18065.0391, grad_fn=<MseLossBackward>)
output :  tensor([[157768.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(53519.9297, grad_fn=<MseLossBackward>)
output :  tensor([[152911.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(9066215., grad_fn=<MseLossBackward>)
output :  tensor([[176245.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4550e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162380.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5668194., grad_fn=<MseLossBackward>)
output :  tensor([[372485.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3191e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126685.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(99146.2656, grad_fn=<MseLossBackward>)
output :  tensor([[129933.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9744e+09, grad_fn=<MseLossBackward>)
output :  tensor([[281596.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(146976.3906, grad_fn=<MseLossBackward>)
output :  tensor([[164054.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4221805., grad_fn=<MseLossBackward>)
output :  tensor([[131709.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2565e+08, grad_fn=<MseLossBackward>)
output :  tensor([[240079.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(65273776., grad_fn=<MseLossBackward>)
output :  tensor([[183172.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7141003.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153784.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3182879., grad_fn=<MseLossBackward>)
output :  tensor([[145501.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(251815.7812, grad_fn=<MseLossBackward>)
output :  tensor([[156439.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8178e+08, grad_fn=<MseLossBackward>)
output :  tensor([[103089.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(9547279., grad_fn=<MseLossBackward>)
output :  tensor([[82513.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0686e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162464.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6431058.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186861.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6924e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160913.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(8486206., grad_fn=<MseLossBackward>)
output :  tensor([[166056.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(73208608., grad_fn=<MseLossBackward>)
output :  tensor([[137567.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(13787.8965, grad_fn=<MseLossBackward>)
output :  tensor([[204352.]], grad_fn=<AddmmBackward>)
loss:  tensor(2553604., grad_fn=<MseLossBackward>)
output :  tensor([[138735.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(540776.3750, grad_fn=<MseLossBackward>)
output :  tensor([[181364.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6547e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147065.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1134391.3750, grad_fn=<MseLossBackward>)
output :  tensor([[112028.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4265e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94573.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(329054.5938, grad_fn=<MseLossBackward>)
output :  tensor([[176221.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1493131.2500, grad_fn=<MseLossBackward>)
output :  tensor([[259582.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(667744.3125, grad_fn=<MseLossBackward>)
output :  tensor([[142717.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1482762.8750, grad_fn=<MseLossBackward>)
output :  tensor([[158891.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1007890.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132167.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(110390.0625, grad_fn=<MseLossBackward>)
output :  tensor([[146126.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(11380502., grad_fn=<MseLossBackward>)
output :  tensor([[169396.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2240494.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125861.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(1296805., grad_fn=<MseLossBackward>)
output :  tensor([[175784.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4768e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156541.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(209993.0625, grad_fn=<MseLossBackward>)
output :  tensor([[113769.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(7454563.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161353.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1333e+09, grad_fn=<MseLossBackward>)
output :  tensor([[53776.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3157562.5000, grad_fn=<MseLossBackward>)
output :  tensor([[231530.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5560e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199946.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1110389., grad_fn=<MseLossBackward>)
output :  tensor([[184539.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(212391.3594, grad_fn=<MseLossBackward>)
output :  tensor([[104527.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(2169614., grad_fn=<MseLossBackward>)
output :  tensor([[88633.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(2668654., grad_fn=<MseLossBackward>)
output :  tensor([[141800.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3242081.5000, grad_fn=<MseLossBackward>)
output :  tensor([[217389.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8692e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200870.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(43952340., grad_fn=<MseLossBackward>)
output :  tensor([[162400.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6757075.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170670.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8981e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189942.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3356.7539, grad_fn=<MseLossBackward>)
output :  tensor([[89224.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4946662.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139660.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(115132.9688, grad_fn=<MseLossBackward>)
output :  tensor([[109947.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(305688.0312, grad_fn=<MseLossBackward>)
output :  tensor([[146785.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1719e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173469.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8037e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193390.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3479e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179822.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(31456.3477, grad_fn=<MseLossBackward>)
output :  tensor([[97742.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1543495.6250, grad_fn=<MseLossBackward>)
output :  tensor([[117681.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(32885.5547, grad_fn=<MseLossBackward>)
output :  tensor([[159734.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8883e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199904.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(9129.2051, grad_fn=<MseLossBackward>)
output :  tensor([[145001.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1003690.8750, grad_fn=<MseLossBackward>)
train_loss: [2.6744128e+09]
epoch_result tensor([0.])
output :  tensor([[158507.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(58.1406, grad_fn=<MseLossBackward>)
output :  tensor([[123365.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1865187.7500, grad_fn=<MseLossBackward>)
output :  tensor([[196157.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3826608.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178222.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1494773.6250, grad_fn=<MseLossBackward>)
output :  tensor([[153663.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9225e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132216.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(17780718., grad_fn=<MseLossBackward>)
output :  tensor([[141074.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5601.5869, grad_fn=<MseLossBackward>)
output :  tensor([[120626.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2644638.2500, grad_fn=<MseLossBackward>)
output :  tensor([[71665.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7332e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165210.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(622742.9375, grad_fn=<MseLossBackward>)
output :  tensor([[140735.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(541213.1250, grad_fn=<MseLossBackward>)
output :  tensor([[226211.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1466899.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167979.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1041866.7500, grad_fn=<MseLossBackward>)
output :  tensor([[248835.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(747279.1875, grad_fn=<MseLossBackward>)
output :  tensor([[58560.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(12675102., grad_fn=<MseLossBackward>)
output :  tensor([[164516.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0065e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164370.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1298e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162944.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(41537624., grad_fn=<MseLossBackward>)
output :  tensor([[274306.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(480682.2188, grad_fn=<MseLossBackward>)
output :  tensor([[196249.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(563391., grad_fn=<MseLossBackward>)
output :  tensor([[138252.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5212e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196051.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4719756., grad_fn=<MseLossBackward>)
output :  tensor([[180114.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0057e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152002.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1004348.4375, grad_fn=<MseLossBackward>)
output :  tensor([[172856.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(8157628.5000, grad_fn=<MseLossBackward>)
output :  tensor([[86552.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1327896.1250, grad_fn=<MseLossBackward>)
output :  tensor([[169598.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2034e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185115.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(13347.4697, grad_fn=<MseLossBackward>)
output :  tensor([[203824.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6703e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110109.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(12043.3477, grad_fn=<MseLossBackward>)
output :  tensor([[174264.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(10656042., grad_fn=<MseLossBackward>)
output :  tensor([[139873.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(11382189., grad_fn=<MseLossBackward>)
output :  tensor([[127429.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2466323., grad_fn=<MseLossBackward>)
output :  tensor([[120245.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(556131.4375, grad_fn=<MseLossBackward>)
output :  tensor([[147452.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2733e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169351.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1213e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152086.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5696277., grad_fn=<MseLossBackward>)
output :  tensor([[180591.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(349576.5625, grad_fn=<MseLossBackward>)
output :  tensor([[143068.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4278369., grad_fn=<MseLossBackward>)
output :  tensor([[106758.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8086e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136721.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1276e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139976.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(24760888., grad_fn=<MseLossBackward>)
output :  tensor([[138466.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3149e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223607.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1939839.6250, grad_fn=<MseLossBackward>)
output :  tensor([[130596.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(2734398.2500, grad_fn=<MseLossBackward>)
output :  tensor([[148044.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(912502.5625, grad_fn=<MseLossBackward>)
output :  tensor([[111638.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(130445.1250, grad_fn=<MseLossBackward>)
output :  tensor([[160766.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(586899.6250, grad_fn=<MseLossBackward>)
output :  tensor([[147304.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2748e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193263.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1597064., grad_fn=<MseLossBackward>)
output :  tensor([[136118.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2784465.7500, grad_fn=<MseLossBackward>)
output :  tensor([[109052.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(897252.9375, grad_fn=<MseLossBackward>)
output :  tensor([[233882.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(13850.3477, grad_fn=<MseLossBackward>)
output :  tensor([[164503.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3997e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155657.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(11170008., grad_fn=<MseLossBackward>)
output :  tensor([[203070.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8706e+10, grad_fn=<MseLossBackward>)
output :  tensor([[240389.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2907e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142808.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(478842.3750, grad_fn=<MseLossBackward>)
output :  tensor([[133497.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(252098.1406, grad_fn=<MseLossBackward>)
output :  tensor([[154841.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(25166.8477, grad_fn=<MseLossBackward>)
output :  tensor([[132165.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4689187., grad_fn=<MseLossBackward>)
output :  tensor([[183569.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8416e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182584.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2297687.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162184.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(468732.7812, grad_fn=<MseLossBackward>)
output :  tensor([[129174.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9116e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145987.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(12163855., grad_fn=<MseLossBackward>)
output :  tensor([[148507.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(12301460., grad_fn=<MseLossBackward>)
output :  tensor([[171838.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6032e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193209.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6597e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138727.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4963148.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168813.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(9523975., grad_fn=<MseLossBackward>)
output :  tensor([[174937.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(36752392., grad_fn=<MseLossBackward>)
output :  tensor([[119026.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(16216540., grad_fn=<MseLossBackward>)
output :  tensor([[217770.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(10426542., grad_fn=<MseLossBackward>)
output :  tensor([[181627.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3504910.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126707.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1458056.2500, grad_fn=<MseLossBackward>)
output :  tensor([[198870.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5617566.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177323.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5874034., grad_fn=<MseLossBackward>)
output :  tensor([[202225.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3865e+10, grad_fn=<MseLossBackward>)
output :  tensor([[210434.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(319684.2188, grad_fn=<MseLossBackward>)
output :  tensor([[170748.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5799e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192789.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2924420.7500, grad_fn=<MseLossBackward>)
output :  tensor([[113829.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(687966.5625, grad_fn=<MseLossBackward>)
output :  tensor([[114233.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(3005970.2500, grad_fn=<MseLossBackward>)
output :  tensor([[113092.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(1193607.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145778.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1042951.5625, grad_fn=<MseLossBackward>)
output :  tensor([[157623.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4232e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180263.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(69679.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128628.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(1272859.8750, grad_fn=<MseLossBackward>)
output :  tensor([[145697.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(486985.9062, grad_fn=<MseLossBackward>)
output :  tensor([[186218.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6336e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118544.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(2705588., grad_fn=<MseLossBackward>)
output :  tensor([[194681.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5376167., grad_fn=<MseLossBackward>)
output :  tensor([[144149.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(723217.3750, grad_fn=<MseLossBackward>)
output :  tensor([[213292.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(153909.0938, grad_fn=<MseLossBackward>)
output :  tensor([[128409.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5803431.5000, grad_fn=<MseLossBackward>)
output :  tensor([[244881.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(11880409., grad_fn=<MseLossBackward>)
output :  tensor([[235674.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4330e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153302.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7970e+08, grad_fn=<MseLossBackward>)
output :  tensor([[84955.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7385e+08, grad_fn=<MseLossBackward>)
output :  tensor([[190935.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0500e+09, grad_fn=<MseLossBackward>)
output :  tensor([[81374.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(140297.0625, grad_fn=<MseLossBackward>)
output :  tensor([[141915.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5835546., grad_fn=<MseLossBackward>)
output :  tensor([[75461.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(1505.8037, grad_fn=<MseLossBackward>)
output :  tensor([[142171.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(611084.1875, grad_fn=<MseLossBackward>)
output :  tensor([[176046.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2179.7227, grad_fn=<MseLossBackward>)
output :  tensor([[153327.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(29885.7656, grad_fn=<MseLossBackward>)
output :  tensor([[105334.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(4264773.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200710.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3234e+10, grad_fn=<MseLossBackward>)
output :  tensor([[128473.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(702.2500, grad_fn=<MseLossBackward>)
output :  tensor([[262796.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9594e+08, grad_fn=<MseLossBackward>)
output :  tensor([[310056.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3227.6602, grad_fn=<MseLossBackward>)
output :  tensor([[110208.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(7333898.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169849.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7026724., grad_fn=<MseLossBackward>)
output :  tensor([[134311.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9231e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130665.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(69455688., grad_fn=<MseLossBackward>)
output :  tensor([[132620.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5620678., grad_fn=<MseLossBackward>)
output :  tensor([[130381.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(28963822., grad_fn=<MseLossBackward>)
output :  tensor([[137578.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8839e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226112.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8765e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186255.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3946e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145555.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2741611.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130457.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(8749625., grad_fn=<MseLossBackward>)
output :  tensor([[113408.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(4657267.5000, grad_fn=<MseLossBackward>)
output :  tensor([[253897.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1170e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136031.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1064411.3750, grad_fn=<MseLossBackward>)
output :  tensor([[205040.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4163321.5000, grad_fn=<MseLossBackward>)
output :  tensor([[97056.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(61523432., grad_fn=<MseLossBackward>)
output :  tensor([[139908.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1748.2852, grad_fn=<MseLossBackward>)
output :  tensor([[204274.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0906e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181697.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3231792.7500, grad_fn=<MseLossBackward>)
output :  tensor([[186032.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1066637.1250, grad_fn=<MseLossBackward>)
output :  tensor([[163647.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1127e+10, grad_fn=<MseLossBackward>)
output :  tensor([[289746.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0479e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197540.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(129071.7891, grad_fn=<MseLossBackward>)
output :  tensor([[258104.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0954e+10, grad_fn=<MseLossBackward>)
output :  tensor([[215698.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5303e+09, grad_fn=<MseLossBackward>)
output :  tensor([[275617.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7125e+09, grad_fn=<MseLossBackward>)
output :  tensor([[222561.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2068203.5000, grad_fn=<MseLossBackward>)
output :  tensor([[222107.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8864e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195631.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1873562.1250, grad_fn=<MseLossBackward>)
output :  tensor([[159625.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3791e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133115.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(378571.0312, grad_fn=<MseLossBackward>)
output :  tensor([[133365.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4557891.5000, grad_fn=<MseLossBackward>)
output :  tensor([[89903.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(1201404.3750, grad_fn=<MseLossBackward>)
output :  tensor([[108647.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(419691.4062, grad_fn=<MseLossBackward>)
output :  tensor([[271308.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3168e+09, grad_fn=<MseLossBackward>)
output :  tensor([[232147.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(8138628.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144488.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(261648.2344, grad_fn=<MseLossBackward>)
output :  tensor([[135582.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3675188.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171213.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6346305.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147901.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(7030369.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165081.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6546e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165128.]], grad_fn=<AddmmBackward>)
loss:  tensor(16384., grad_fn=<MseLossBackward>)
output :  tensor([[138198.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1437338.7500, grad_fn=<MseLossBackward>)
output :  tensor([[188621.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3721e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114266.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(5136703.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170483.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2299345.7500, grad_fn=<MseLossBackward>)
output :  tensor([[124181.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(17488340., grad_fn=<MseLossBackward>)
output :  tensor([[83949.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(9306313., grad_fn=<MseLossBackward>)
output :  tensor([[179626.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(139338.8906, grad_fn=<MseLossBackward>)
output :  tensor([[109817.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(6785.6406, grad_fn=<MseLossBackward>)
output :  tensor([[230127.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(78715160., grad_fn=<MseLossBackward>)
output :  tensor([[242380.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6863909., grad_fn=<MseLossBackward>)
output :  tensor([[129530.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(946.5237, grad_fn=<MseLossBackward>)
output :  tensor([[109417.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(209964.4219, grad_fn=<MseLossBackward>)
output :  tensor([[287159.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2498e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171896.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(157150.2969, grad_fn=<MseLossBackward>)
output :  tensor([[127821.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(7963551.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146680.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2256e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199587.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0773e+08, grad_fn=<MseLossBackward>)
output :  tensor([[143788.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7777301., grad_fn=<MseLossBackward>)
output :  tensor([[157484.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5010e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157483.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(12841472., grad_fn=<MseLossBackward>)
output :  tensor([[131780.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5202889.5000, grad_fn=<MseLossBackward>)
output :  tensor([[243469.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8233e+10, grad_fn=<MseLossBackward>)
output :  tensor([[396988.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(25116386., grad_fn=<MseLossBackward>)
output :  tensor([[116105.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(50488684., grad_fn=<MseLossBackward>)
output :  tensor([[123034.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(20565516., grad_fn=<MseLossBackward>)
output :  tensor([[159014.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(235452.4062, grad_fn=<MseLossBackward>)
output :  tensor([[132847.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4744e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165047.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2436e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174169.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1177e+09, grad_fn=<MseLossBackward>)
output :  tensor([[104556.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(914967., grad_fn=<MseLossBackward>)
output :  tensor([[140281.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(515725.9688, grad_fn=<MseLossBackward>)
output :  tensor([[361504.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(33517586., grad_fn=<MseLossBackward>)
output :  tensor([[200577.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8540e+09, grad_fn=<MseLossBackward>)
output :  tensor([[177045.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2390067.7500, grad_fn=<MseLossBackward>)
output :  tensor([[201806.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1195605.6250, grad_fn=<MseLossBackward>)
output :  tensor([[141031.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4126865.2500, grad_fn=<MseLossBackward>)
output :  tensor([[191580.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8524119., grad_fn=<MseLossBackward>)
output :  tensor([[137949.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2714e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179561.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2069282.2500, grad_fn=<MseLossBackward>)
output :  tensor([[240955.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1090066.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175078.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1163431.8750, grad_fn=<MseLossBackward>)
output :  tensor([[112299.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(18483080., grad_fn=<MseLossBackward>)
output :  tensor([[263972.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(346736.9688, grad_fn=<MseLossBackward>)
output :  tensor([[250018.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(333.0625, grad_fn=<MseLossBackward>)
output :  tensor([[121889.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(1233366.3750, grad_fn=<MseLossBackward>)
output :  tensor([[215332.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5602e+09, grad_fn=<MseLossBackward>)
output :  tensor([[302090.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3868e+08, grad_fn=<MseLossBackward>)
output :  tensor([[205672.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1761800., grad_fn=<MseLossBackward>)
output :  tensor([[212309.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6305e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160298.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5751603., grad_fn=<MseLossBackward>)
output :  tensor([[168840.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1321062.8750, grad_fn=<MseLossBackward>)
output :  tensor([[159157.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4953128.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170327.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(107133.4688, grad_fn=<MseLossBackward>)
output :  tensor([[233686.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1774e+09, grad_fn=<MseLossBackward>)
output :  tensor([[211658.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1675e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161247.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0299e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122335.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(441726.3750, grad_fn=<MseLossBackward>)
output :  tensor([[176381.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(382928.9062, grad_fn=<MseLossBackward>)
output :  tensor([[179845.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4247e+09, grad_fn=<MseLossBackward>)
output :  tensor([[203183.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6647e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136241.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3274686., grad_fn=<MseLossBackward>)
output :  tensor([[152951.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8289e+08, grad_fn=<MseLossBackward>)
output :  tensor([[272204.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(22999218., grad_fn=<MseLossBackward>)
output :  tensor([[87124.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4511641.5000, grad_fn=<MseLossBackward>)
output :  tensor([[234122.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5651540.5000, grad_fn=<MseLossBackward>)
output :  tensor([[258983.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0494e+11, grad_fn=<MseLossBackward>)
output :  tensor([[171044.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1091959.7500, grad_fn=<MseLossBackward>)
output :  tensor([[190494.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9807e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153189.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3279664.5000, grad_fn=<MseLossBackward>)
output :  tensor([[206814.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9924e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130326.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(1760037.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145522.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(272500.3125, grad_fn=<MseLossBackward>)
output :  tensor([[169139.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0968e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186768.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(843929.3125, grad_fn=<MseLossBackward>)
output :  tensor([[126733.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(537380.6250, grad_fn=<MseLossBackward>)
output :  tensor([[136928.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(183197.3750, grad_fn=<MseLossBackward>)
output :  tensor([[176968.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(15748248., grad_fn=<MseLossBackward>)
output :  tensor([[198713.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6303e+09, grad_fn=<MseLossBackward>)
output :  tensor([[241090.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3647145., grad_fn=<MseLossBackward>)
output :  tensor([[154081.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(843785.7500, grad_fn=<MseLossBackward>)
output :  tensor([[199109.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(9668796., grad_fn=<MseLossBackward>)
output :  tensor([[164261.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1055e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194882.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3662e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179473.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(182088.8906, grad_fn=<MseLossBackward>)
output :  tensor([[99022.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(4089337., grad_fn=<MseLossBackward>)
output :  tensor([[172551.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1545e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135671.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(450345.8438, grad_fn=<MseLossBackward>)
output :  tensor([[121751.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(45578216., grad_fn=<MseLossBackward>)
output :  tensor([[173039.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(922890.4375, grad_fn=<MseLossBackward>)
output :  tensor([[88398.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(11549431., grad_fn=<MseLossBackward>)
output :  tensor([[293715.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(13803083., grad_fn=<MseLossBackward>)
output :  tensor([[165702.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(493659.9375, grad_fn=<MseLossBackward>)
output :  tensor([[190487.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0358e+10, grad_fn=<MseLossBackward>)
output :  tensor([[241248.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8517e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154212.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(10317747., grad_fn=<MseLossBackward>)
output :  tensor([[126051.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(4208107.5000, grad_fn=<MseLossBackward>)
output :  tensor([[114715.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(26874586., grad_fn=<MseLossBackward>)
output :  tensor([[146437.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8834e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172269.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2995495.5000, grad_fn=<MseLossBackward>)
output :  tensor([[113739.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7588e+08, grad_fn=<MseLossBackward>)
output :  tensor([[205122.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2741e+10, grad_fn=<MseLossBackward>)
output :  tensor([[236250.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(27558890., grad_fn=<MseLossBackward>)
output :  tensor([[247784.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1729e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221983.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8956e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194737.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4584e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188930.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2046419.6250, grad_fn=<MseLossBackward>)
output :  tensor([[206844.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7535e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187825.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1956e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180504.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3112578., grad_fn=<MseLossBackward>)
output :  tensor([[150555.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2085587.2500, grad_fn=<MseLossBackward>)
output :  tensor([[330781.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(38666632., grad_fn=<MseLossBackward>)
output :  tensor([[210106.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3585460.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160845.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(715055.1875, grad_fn=<MseLossBackward>)
output :  tensor([[184908.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2026e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107201.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(4847118., grad_fn=<MseLossBackward>)
output :  tensor([[266814.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3051e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171136.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7638055., grad_fn=<MseLossBackward>)
output :  tensor([[213226.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(74759.5234, grad_fn=<MseLossBackward>)
output :  tensor([[203059.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2186e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179153.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2194.3369, grad_fn=<MseLossBackward>)
output :  tensor([[200505.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1676903.6250, grad_fn=<MseLossBackward>)
output :  tensor([[155622.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(387350.6250, grad_fn=<MseLossBackward>)
output :  tensor([[151533.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6557e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118099.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(160631.8750, grad_fn=<MseLossBackward>)
output :  tensor([[139496.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(253402.1250, grad_fn=<MseLossBackward>)
output :  tensor([[149127.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(16188.5859, grad_fn=<MseLossBackward>)
output :  tensor([[200498.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6257e+10, grad_fn=<MseLossBackward>)
output :  tensor([[162700.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(10244400., grad_fn=<MseLossBackward>)
output :  tensor([[103356.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(14876389., grad_fn=<MseLossBackward>)
output :  tensor([[224448.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4186e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188681.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3737e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179529.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9269266., grad_fn=<MseLossBackward>)
output :  tensor([[84578.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(6647494., grad_fn=<MseLossBackward>)
output :  tensor([[130659.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4663980., grad_fn=<MseLossBackward>)
output :  tensor([[213130.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(756682.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144587.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(345560.2812, grad_fn=<MseLossBackward>)
output :  tensor([[135306.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(28161264., grad_fn=<MseLossBackward>)
output :  tensor([[143639.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1080950.1250, grad_fn=<MseLossBackward>)
output :  tensor([[179657.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7773e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144966.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(933850.4375, grad_fn=<MseLossBackward>)
output :  tensor([[160169.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(28682.5977, grad_fn=<MseLossBackward>)
output :  tensor([[213109.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3574108.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138573.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1272e+09, grad_fn=<MseLossBackward>)
output :  tensor([[256774.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3147131.5000, grad_fn=<MseLossBackward>)
output :  tensor([[156562.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(8629090., grad_fn=<MseLossBackward>)
output :  tensor([[128851.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(123590.6953, grad_fn=<MseLossBackward>)
output :  tensor([[96152.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(1327770.1250, grad_fn=<MseLossBackward>)
output :  tensor([[154594.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9132e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179685.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(46070.5977, grad_fn=<MseLossBackward>)
output :  tensor([[120727.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(51894.9766, grad_fn=<MseLossBackward>)
output :  tensor([[186960.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7631e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145285.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3277e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150674.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(600528.1250, grad_fn=<MseLossBackward>)
output :  tensor([[188192.]], grad_fn=<AddmmBackward>)
loss:  tensor(195364., grad_fn=<MseLossBackward>)
output :  tensor([[247989.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0329e+09, grad_fn=<MseLossBackward>)
output :  tensor([[93527.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4112530.5000, grad_fn=<MseLossBackward>)
output :  tensor([[235716.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(18345428., grad_fn=<MseLossBackward>)
output :  tensor([[128809.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(95645.2266, grad_fn=<MseLossBackward>)
output :  tensor([[166128.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9544e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113347.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7817e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178217.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4917583.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163943.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0237e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155726.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3639e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238152.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(718759.5625, grad_fn=<MseLossBackward>)
output :  tensor([[227788.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1271e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126240.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(577006.3750, grad_fn=<MseLossBackward>)
output :  tensor([[127670.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(2791745., grad_fn=<MseLossBackward>)
output :  tensor([[222406.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(21100386., grad_fn=<MseLossBackward>)
output :  tensor([[233433.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(320621.3750, grad_fn=<MseLossBackward>)
output :  tensor([[225487.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1470724.6250, grad_fn=<MseLossBackward>)
output :  tensor([[146889.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1232793.8750, grad_fn=<MseLossBackward>)
output :  tensor([[208480.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2309877.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131029.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2166e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135942.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(11849623., grad_fn=<MseLossBackward>)
output :  tensor([[308866.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(37624040., grad_fn=<MseLossBackward>)
output :  tensor([[142840.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3388705.7500, grad_fn=<MseLossBackward>)
output :  tensor([[122315.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0598e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108129.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1877242.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155312.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9540e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176629.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6228e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175357.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5556406.5000, grad_fn=<MseLossBackward>)
output :  tensor([[189700.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2769e+08, grad_fn=<MseLossBackward>)
output :  tensor([[99402.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(357267.7188, grad_fn=<MseLossBackward>)
output :  tensor([[176641.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5564586., grad_fn=<MseLossBackward>)
output :  tensor([[171196.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(10869488., grad_fn=<MseLossBackward>)
output :  tensor([[138133.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(751255.5625, grad_fn=<MseLossBackward>)
output :  tensor([[259692.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8818e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141760.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2218e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173089.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7957.1973, grad_fn=<MseLossBackward>)
output :  tensor([[140649.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(421647.3125, grad_fn=<MseLossBackward>)
output :  tensor([[201530.]], grad_fn=<AddmmBackward>)
loss:  tensor(1060900., grad_fn=<MseLossBackward>)
output :  tensor([[168655.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1806924., grad_fn=<MseLossBackward>)
output :  tensor([[239766.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(17920406., grad_fn=<MseLossBackward>)
output :  tensor([[132707.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3214625., grad_fn=<MseLossBackward>)
output :  tensor([[151295.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3786794.5000, grad_fn=<MseLossBackward>)
output :  tensor([[211057.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(15546386., grad_fn=<MseLossBackward>)
output :  tensor([[160656.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(18867892., grad_fn=<MseLossBackward>)
output :  tensor([[181438.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(57175100., grad_fn=<MseLossBackward>)
output :  tensor([[133750.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3752e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127962.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(1077168.2500, grad_fn=<MseLossBackward>)
output :  tensor([[137056.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(8662721., grad_fn=<MseLossBackward>)
output :  tensor([[201021.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6894e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165306.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5307e+09, grad_fn=<MseLossBackward>)
output :  tensor([[77698.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1324e+08, grad_fn=<MseLossBackward>)
output :  tensor([[95062.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1157e+08, grad_fn=<MseLossBackward>)
output :  tensor([[258497.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(27088122., grad_fn=<MseLossBackward>)
output :  tensor([[203586.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1714e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115142.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(20270.6406, grad_fn=<MseLossBackward>)
output :  tensor([[156276.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7491e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203811.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6208e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180075.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0864e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159171.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(17404672., grad_fn=<MseLossBackward>)
output :  tensor([[169873.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(16006.2031, grad_fn=<MseLossBackward>)
output :  tensor([[117223.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4945481., grad_fn=<MseLossBackward>)
output :  tensor([[163445.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(71323832., grad_fn=<MseLossBackward>)
output :  tensor([[193100.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9042e+08, grad_fn=<MseLossBackward>)
output :  tensor([[218157.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1802096.5000, grad_fn=<MseLossBackward>)
output :  tensor([[245265.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4973e+11, grad_fn=<MseLossBackward>)
output :  tensor([[144518.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(6156214., grad_fn=<MseLossBackward>)
output :  tensor([[109411.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(868041.6250, grad_fn=<MseLossBackward>)
output :  tensor([[171557.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0697e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153683.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(10132782., grad_fn=<MseLossBackward>)
output :  tensor([[234635.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(5591451.5000, grad_fn=<MseLossBackward>)
output :  tensor([[114842.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(24680.9004, grad_fn=<MseLossBackward>)
output :  tensor([[178215.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(21947760., grad_fn=<MseLossBackward>)
output :  tensor([[188980.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5201963., grad_fn=<MseLossBackward>)
output :  tensor([[163120.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4611e+10, grad_fn=<MseLossBackward>)
output :  tensor([[99263.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3355e+08, grad_fn=<MseLossBackward>)
output :  tensor([[242833.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(14697040., grad_fn=<MseLossBackward>)
output :  tensor([[178441.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5958938.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138942.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1118835., grad_fn=<MseLossBackward>)
output :  tensor([[236367.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1869928., grad_fn=<MseLossBackward>)
output :  tensor([[161488.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2285671.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200378.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5531e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133606.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1940927.8750, grad_fn=<MseLossBackward>)
output :  tensor([[186873.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1870e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135061.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(880225.1250, grad_fn=<MseLossBackward>)
output :  tensor([[224102.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4156e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222259.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6956e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91219.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(1486284.8750, grad_fn=<MseLossBackward>)
output :  tensor([[161587.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4638168., grad_fn=<MseLossBackward>)
output :  tensor([[242824.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6398e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149297.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(18470520., grad_fn=<MseLossBackward>)
output :  tensor([[110861.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9238e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166228.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2986794., grad_fn=<MseLossBackward>)
output :  tensor([[144370.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(137189.2188, grad_fn=<MseLossBackward>)
output :  tensor([[128259.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(3513.3403, grad_fn=<MseLossBackward>)
output :  tensor([[188637.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9508e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124445.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(3785122.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153506.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2268271.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170092.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2745752.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151586.]], grad_fn=<AddmmBackward>)
loss:  tensor(343396., grad_fn=<MseLossBackward>)
output :  tensor([[156375.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(42571752., grad_fn=<MseLossBackward>)
output :  tensor([[135128.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8267e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134899.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(8404654., grad_fn=<MseLossBackward>)
output :  tensor([[155313.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6613e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145468.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1733789.3750, grad_fn=<MseLossBackward>)
output :  tensor([[164437.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7220557., grad_fn=<MseLossBackward>)
output :  tensor([[145300.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2532e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150576.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3155175., grad_fn=<MseLossBackward>)
output :  tensor([[185027.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8836871., grad_fn=<MseLossBackward>)
output :  tensor([[168948.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2610.5713, grad_fn=<MseLossBackward>)
output :  tensor([[179349.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(423129.9375, grad_fn=<MseLossBackward>)
output :  tensor([[221429.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2043693.6250, grad_fn=<MseLossBackward>)
output :  tensor([[113930.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(36363916., grad_fn=<MseLossBackward>)
output :  tensor([[138314.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7995e+08, grad_fn=<MseLossBackward>)
output :  tensor([[283088.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8477742., grad_fn=<MseLossBackward>)
output :  tensor([[116720.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(518670.0312, grad_fn=<MseLossBackward>)
output :  tensor([[175069.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0188e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185448.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(201040.1406, grad_fn=<MseLossBackward>)
output :  tensor([[180886.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(21285392., grad_fn=<MseLossBackward>)
output :  tensor([[249795.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3529e+08, grad_fn=<MseLossBackward>)
output :  tensor([[217609.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(19276354., grad_fn=<MseLossBackward>)
output :  tensor([[133503.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6195e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174671.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6965e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123020.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(959206., grad_fn=<MseLossBackward>)
output :  tensor([[182183.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5842e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149219.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(14290290., grad_fn=<MseLossBackward>)
output :  tensor([[156265.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(95369872., grad_fn=<MseLossBackward>)
output :  tensor([[206166.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(17889.0625, grad_fn=<MseLossBackward>)
output :  tensor([[145099.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5876e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175066.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(871772.3750, grad_fn=<MseLossBackward>)
output :  tensor([[253568.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7246e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148030.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(938.8479, grad_fn=<MseLossBackward>)
output :  tensor([[201180.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2203369.2500, grad_fn=<MseLossBackward>)
output :  tensor([[165036.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(25867714., grad_fn=<MseLossBackward>)
output :  tensor([[129627.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7328e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138137.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5701499.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180772.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(10413630., grad_fn=<MseLossBackward>)
output :  tensor([[190918.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(843843.1875, grad_fn=<MseLossBackward>)
output :  tensor([[219338.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8528e+09, grad_fn=<MseLossBackward>)
output :  tensor([[247182.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(96390672., grad_fn=<MseLossBackward>)
output :  tensor([[181081.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9021e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144752.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8358e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143499.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1000781.3750, grad_fn=<MseLossBackward>)
output :  tensor([[74893.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2175e+09, grad_fn=<MseLossBackward>)
output :  tensor([[132909.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4370843.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131776.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8273173.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154834.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(696885.8125, grad_fn=<MseLossBackward>)
output :  tensor([[129168.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(4701138.5000, grad_fn=<MseLossBackward>)
output :  tensor([[76026.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(224365.0469, grad_fn=<MseLossBackward>)
output :  tensor([[86960.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(24610126., grad_fn=<MseLossBackward>)
output :  tensor([[244576.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5818e+08, grad_fn=<MseLossBackward>)
output :  tensor([[142237.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8434e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129497.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(1004771.3125, grad_fn=<MseLossBackward>)
output :  tensor([[167857.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(735279.4375, grad_fn=<MseLossBackward>)
output :  tensor([[235880.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(775417.8125, grad_fn=<MseLossBackward>)
output :  tensor([[187619.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(20432236., grad_fn=<MseLossBackward>)
output :  tensor([[158149.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4619745.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198507.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(368999.3125, grad_fn=<MseLossBackward>)
output :  tensor([[196024.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6790e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136863.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(18593.8789, grad_fn=<MseLossBackward>)
output :  tensor([[153706.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1674395.6250, grad_fn=<MseLossBackward>)
output :  tensor([[136397.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(157695.8594, grad_fn=<MseLossBackward>)
output :  tensor([[193857.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3063e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153727.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(74060.5234, grad_fn=<MseLossBackward>)
output :  tensor([[139411.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1079e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145023.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(15275.4150, grad_fn=<MseLossBackward>)
output :  tensor([[211407.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(350575., grad_fn=<MseLossBackward>)
output :  tensor([[108812.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1890e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168863.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1860453.3750, grad_fn=<MseLossBackward>)
output :  tensor([[129928.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3719956., grad_fn=<MseLossBackward>)
output :  tensor([[144972.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4108982.5000, grad_fn=<MseLossBackward>)
output :  tensor([[107036.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9939e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139734.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4994596.5000, grad_fn=<MseLossBackward>)
output :  tensor([[236876.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(768471.3750, grad_fn=<MseLossBackward>)
output :  tensor([[142351.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(7013973., grad_fn=<MseLossBackward>)
output :  tensor([[140264.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7640214.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166057.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4484e+09, grad_fn=<MseLossBackward>)
output :  tensor([[263271.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1692e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173256.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3040064.7500, grad_fn=<MseLossBackward>)
output :  tensor([[105756.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8885802., grad_fn=<MseLossBackward>)
output :  tensor([[198154.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2957e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155727.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(10707007., grad_fn=<MseLossBackward>)
output :  tensor([[160616.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7007e+10, grad_fn=<MseLossBackward>)
output :  tensor([[100857.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(6538369., grad_fn=<MseLossBackward>)
output :  tensor([[123336.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(69522.8594, grad_fn=<MseLossBackward>)
output :  tensor([[153891.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4446760.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140447.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(200340.1719, grad_fn=<MseLossBackward>)
output :  tensor([[205251.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(27573166., grad_fn=<MseLossBackward>)
output :  tensor([[145683.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(13565410., grad_fn=<MseLossBackward>)
output :  tensor([[260052.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4960364., grad_fn=<MseLossBackward>)
output :  tensor([[130320.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3928e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163900.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2558750.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188498.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3928, grad_fn=<MseLossBackward>)
output :  tensor([[125530.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4119e+08, grad_fn=<MseLossBackward>)
output :  tensor([[257922.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(62760312., grad_fn=<MseLossBackward>)
output :  tensor([[156019.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5978e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244857.]], grad_fn=<AddmmBackward>)
loss:  tensor(243049., grad_fn=<MseLossBackward>)
output :  tensor([[146403.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5777563.5000, grad_fn=<MseLossBackward>)
output :  tensor([[208789.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1464440.3750, grad_fn=<MseLossBackward>)
output :  tensor([[171545.]], grad_fn=<AddmmBackward>)
loss:  tensor(731025., grad_fn=<MseLossBackward>)
output :  tensor([[153741.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(66814.1719, grad_fn=<MseLossBackward>)
output :  tensor([[121753.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(14088586., grad_fn=<MseLossBackward>)
output :  tensor([[233466.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8755e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239136.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(744930.8125, grad_fn=<MseLossBackward>)
output :  tensor([[152544.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(628427.8125, grad_fn=<MseLossBackward>)
output :  tensor([[252994.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3629620.2500, grad_fn=<MseLossBackward>)
output :  tensor([[121089.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(43365208., grad_fn=<MseLossBackward>)
output :  tensor([[177291.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1667730.1250, grad_fn=<MseLossBackward>)
output :  tensor([[163639.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(13247325., grad_fn=<MseLossBackward>)
output :  tensor([[132195.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1428585.2500, grad_fn=<MseLossBackward>)
output :  tensor([[198233.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7243e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167735.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(13954194., grad_fn=<MseLossBackward>)
output :  tensor([[159042.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(15660941., grad_fn=<MseLossBackward>)
output :  tensor([[157599.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(160563., grad_fn=<MseLossBackward>)
output :  tensor([[147463.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5934324.5000, grad_fn=<MseLossBackward>)
output :  tensor([[173957.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1547e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162047.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4190912.7500, grad_fn=<MseLossBackward>)
output :  tensor([[373294.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1397e+08, grad_fn=<MseLossBackward>)
output :  tensor([[142254.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3271e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130438.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0194e+09, grad_fn=<MseLossBackward>)
output :  tensor([[279382.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3349472., grad_fn=<MseLossBackward>)
output :  tensor([[161135.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(748116.8750, grad_fn=<MseLossBackward>)
output :  tensor([[135505.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2517e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227318.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(21917906., grad_fn=<MseLossBackward>)
output :  tensor([[178131.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(5609792., grad_fn=<MseLossBackward>)
output :  tensor([[152406.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(165204.1406, grad_fn=<MseLossBackward>)
output :  tensor([[143975.]], grad_fn=<AddmmBackward>)
loss:  tensor(1050625., grad_fn=<MseLossBackward>)
output :  tensor([[156201.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7254e+08, grad_fn=<MseLossBackward>)
output :  tensor([[100631.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(398654.1250, grad_fn=<MseLossBackward>)
output :  tensor([[82502.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0635e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163451.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2399013.7500, grad_fn=<MseLossBackward>)
output :  tensor([[187576.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6340e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160303.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5306472., grad_fn=<MseLossBackward>)
output :  tensor([[156079.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2018397.3750, grad_fn=<MseLossBackward>)
output :  tensor([[133751.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(13679480., grad_fn=<MseLossBackward>)
output :  tensor([[210354.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(19402374., grad_fn=<MseLossBackward>)
output :  tensor([[138046.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2123.1936, grad_fn=<MseLossBackward>)
output :  tensor([[180800.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6692e+10, grad_fn=<MseLossBackward>)
output :  tensor([[148057.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4232663.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110737.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6936e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93926.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(5442.5200, grad_fn=<MseLossBackward>)
output :  tensor([[174451.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(301075.1250, grad_fn=<MseLossBackward>)
output :  tensor([[264304.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(15242680., grad_fn=<MseLossBackward>)
output :  tensor([[140476.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1048128.0625, grad_fn=<MseLossBackward>)
output :  tensor([[159292.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(363401.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135021.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6360326.5000, grad_fn=<MseLossBackward>)
output :  tensor([[149740.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(58050.8789, grad_fn=<MseLossBackward>)
output :  tensor([[170572.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7143926.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126172.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(684510.6250, grad_fn=<MseLossBackward>)
output :  tensor([[175869.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5295e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158991.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3965761., grad_fn=<MseLossBackward>)
output :  tensor([[122267.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(33267030., grad_fn=<MseLossBackward>)
output :  tensor([[160915.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1961e+09, grad_fn=<MseLossBackward>)
output :  tensor([[51756.4336]], grad_fn=<AddmmBackward>)
loss:  tensor(59324.5938, grad_fn=<MseLossBackward>)
output :  tensor([[233629.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2206e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199820.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1390888.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183664.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1784353.2500, grad_fn=<MseLossBackward>)
output :  tensor([[107685.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(2841463.2500, grad_fn=<MseLossBackward>)
output :  tensor([[87395.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(156766.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135892.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(16874894., grad_fn=<MseLossBackward>)
output :  tensor([[216295.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0381e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200573.]], grad_fn=<AddmmBackward>)
loss:  tensor(47983328., grad_fn=<MseLossBackward>)
output :  tensor([[166849.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3420014.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171399.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7611e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192313.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5353511.5000, grad_fn=<MseLossBackward>)
output :  tensor([[87876.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(768444., grad_fn=<MseLossBackward>)
output :  tensor([[141530.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2341330.2500, grad_fn=<MseLossBackward>)
output :  tensor([[111315.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(665435.3125, grad_fn=<MseLossBackward>)
output :  tensor([[148235.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5068e+08, grad_fn=<MseLossBackward>)
output :  tensor([[170889.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5912e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194064.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1959e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180331.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(109747.2656, grad_fn=<MseLossBackward>)
output :  tensor([[100227.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(13891170., grad_fn=<MseLossBackward>)
output :  tensor([[118110.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(372147.6562, grad_fn=<MseLossBackward>)
output :  tensor([[160035.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7432e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202904.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8436846., grad_fn=<MseLossBackward>)
output :  tensor([[141767.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4982103., grad_fn=<MseLossBackward>)
train_loss: [2.6742682e+09]
epoch_result tensor([0.])
output :  tensor([[156228.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5161558., grad_fn=<MseLossBackward>)
output :  tensor([[124082.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(4338531., grad_fn=<MseLossBackward>)
output :  tensor([[192421.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3168177.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176200.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(639225.2500, grad_fn=<MseLossBackward>)
output :  tensor([[154867.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3512e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127273.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(527575.2500, grad_fn=<MseLossBackward>)
output :  tensor([[141827.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(685428.7500, grad_fn=<MseLossBackward>)
output :  tensor([[119297.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(88264.6953, grad_fn=<MseLossBackward>)
output :  tensor([[72381.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9270e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165426.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(328400.6250, grad_fn=<MseLossBackward>)
output :  tensor([[137723.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5184586.5000, grad_fn=<MseLossBackward>)
output :  tensor([[227222.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4938534., grad_fn=<MseLossBackward>)
output :  tensor([[166615.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5687629., grad_fn=<MseLossBackward>)
output :  tensor([[250036.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(113221.7344, grad_fn=<MseLossBackward>)
output :  tensor([[56214.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1475162.1250, grad_fn=<MseLossBackward>)
output :  tensor([[163846.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7429e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174817.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(33192.2852, grad_fn=<MseLossBackward>)
output :  tensor([[157816.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1732308.3750, grad_fn=<MseLossBackward>)
output :  tensor([[276103.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1217712.2500, grad_fn=<MseLossBackward>)
output :  tensor([[194756.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5034274., grad_fn=<MseLossBackward>)
output :  tensor([[135725.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6604e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196918.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(9239415., grad_fn=<MseLossBackward>)
output :  tensor([[176755.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3179e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152185.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1405817.7500, grad_fn=<MseLossBackward>)
output :  tensor([[172187.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4786865.5000, grad_fn=<MseLossBackward>)
output :  tensor([[85074.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(105807.8906, grad_fn=<MseLossBackward>)
output :  tensor([[168063.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0320e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182619.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5664920.5000, grad_fn=<MseLossBackward>)
output :  tensor([[203447.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7094e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111337.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(1787798.7500, grad_fn=<MseLossBackward>)
output :  tensor([[172352.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1829044.8750, grad_fn=<MseLossBackward>)
output :  tensor([[137011.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(261728.1719, grad_fn=<MseLossBackward>)
output :  tensor([[128697.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(91397.5703, grad_fn=<MseLossBackward>)
output :  tensor([[119926.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(182148.9062, grad_fn=<MseLossBackward>)
output :  tensor([[146375.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6295e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169680.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1118e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150437.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(544505.6250, grad_fn=<MseLossBackward>)
output :  tensor([[180944.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(892788.7500, grad_fn=<MseLossBackward>)
output :  tensor([[145304.]], grad_fn=<AddmmBackward>)
loss:  tensor(18524416., grad_fn=<MseLossBackward>)
output :  tensor([[108254.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3322e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133911.]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5754e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135851.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(724706.3750, grad_fn=<MseLossBackward>)
output :  tensor([[139669.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6053e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222475.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6372548., grad_fn=<MseLossBackward>)
output :  tensor([[133105.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(732415.0625, grad_fn=<MseLossBackward>)
output :  tensor([[149555.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(308181.1250, grad_fn=<MseLossBackward>)
output :  tensor([[113141.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(1303896.3750, grad_fn=<MseLossBackward>)
output :  tensor([[160500.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(250766.2188, grad_fn=<MseLossBackward>)
output :  tensor([[147817.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2262e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192080.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6457.6289, grad_fn=<MseLossBackward>)
output :  tensor([[135228.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(606816.6875, grad_fn=<MseLossBackward>)
output :  tensor([[124405.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0753e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235771.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3137714., grad_fn=<MseLossBackward>)
output :  tensor([[162728.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5767e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164322.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(28327842., grad_fn=<MseLossBackward>)
output :  tensor([[204666.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8168e+10, grad_fn=<MseLossBackward>)
output :  tensor([[238366.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3371e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142571.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(862141.2500, grad_fn=<MseLossBackward>)
output :  tensor([[133173.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(683877.3125, grad_fn=<MseLossBackward>)
output :  tensor([[157653.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7042803.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134538.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(20595288., grad_fn=<MseLossBackward>)
output :  tensor([[179802.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4316e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182120.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3917863.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161021.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(228947.2969, grad_fn=<MseLossBackward>)
output :  tensor([[142385.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(377130.3125, grad_fn=<MseLossBackward>)
output :  tensor([[143287.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(620599.3125, grad_fn=<MseLossBackward>)
output :  tensor([[142324.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7156377.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170878.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7345e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193109.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7076e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140867.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(19078742., grad_fn=<MseLossBackward>)
output :  tensor([[173329.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2043246.8750, grad_fn=<MseLossBackward>)
output :  tensor([[179130.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3495673., grad_fn=<MseLossBackward>)
output :  tensor([[118244.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(10525614., grad_fn=<MseLossBackward>)
output :  tensor([[222540.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2372947.7500, grad_fn=<MseLossBackward>)
output :  tensor([[183935.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(189496.9688, grad_fn=<MseLossBackward>)
output :  tensor([[125954.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(206847.2969, grad_fn=<MseLossBackward>)
output :  tensor([[193479.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(9123515., grad_fn=<MseLossBackward>)
output :  tensor([[174115.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(615489.3125, grad_fn=<MseLossBackward>)
output :  tensor([[203997.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3216e+10, grad_fn=<MseLossBackward>)
output :  tensor([[206320.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(21897574., grad_fn=<MseLossBackward>)
output :  tensor([[166571.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2653e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192321.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4743752., grad_fn=<MseLossBackward>)
output :  tensor([[110867.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(4547789.5000, grad_fn=<MseLossBackward>)
output :  tensor([[114836.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5457188., grad_fn=<MseLossBackward>)
output :  tensor([[111731.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(72188.7734, grad_fn=<MseLossBackward>)
output :  tensor([[147454.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(428452.0625, grad_fn=<MseLossBackward>)
output :  tensor([[159091.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3691e+10, grad_fn=<MseLossBackward>)
output :  tensor([[181191.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1420752.2500, grad_fn=<MseLossBackward>)
output :  tensor([[126765.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(539513.1875, grad_fn=<MseLossBackward>)
output :  tensor([[145285.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(81456.7266, grad_fn=<MseLossBackward>)
output :  tensor([[188096.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8298e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117624.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(525387.1250, grad_fn=<MseLossBackward>)
output :  tensor([[200889.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(15128940., grad_fn=<MseLossBackward>)
output :  tensor([[144667.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(110743.3594, grad_fn=<MseLossBackward>)
output :  tensor([[209331.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(12731851., grad_fn=<MseLossBackward>)
output :  tensor([[127209.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1461832.1250, grad_fn=<MseLossBackward>)
output :  tensor([[246043.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5220368., grad_fn=<MseLossBackward>)
output :  tensor([[232187.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7892e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152493.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4492e+08, grad_fn=<MseLossBackward>)
output :  tensor([[88315.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4615e+08, grad_fn=<MseLossBackward>)
output :  tensor([[189071.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3665e+09, grad_fn=<MseLossBackward>)
output :  tensor([[75493.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(30317326., grad_fn=<MseLossBackward>)
output :  tensor([[138663.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(699314.0625, grad_fn=<MseLossBackward>)
output :  tensor([[78339.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8060985.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145609.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7055498., grad_fn=<MseLossBackward>)
output :  tensor([[176459.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(211011.0312, grad_fn=<MseLossBackward>)
output :  tensor([[151988.]], grad_fn=<AddmmBackward>)
loss:  tensor(2286144., grad_fn=<MseLossBackward>)
output :  tensor([[110932.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(12476183., grad_fn=<MseLossBackward>)
output :  tensor([[204599.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2354e+10, grad_fn=<MseLossBackward>)
output :  tensor([[131079.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6653417., grad_fn=<MseLossBackward>)
output :  tensor([[264403.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4326e+08, grad_fn=<MseLossBackward>)
output :  tensor([[301956.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(64693368., grad_fn=<MseLossBackward>)
output :  tensor([[108364.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(746766., grad_fn=<MseLossBackward>)
output :  tensor([[170625.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3513633., grad_fn=<MseLossBackward>)
output :  tensor([[132385.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9466e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139393.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(154829.9531, grad_fn=<MseLossBackward>)
output :  tensor([[130159.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(8157.7588, grad_fn=<MseLossBackward>)
output :  tensor([[126724.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2974762.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134703.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3521e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225732.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8914e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186421.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3894e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142070.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3346384.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123571.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(15431148., grad_fn=<MseLossBackward>)
output :  tensor([[109983.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1604398.2500, grad_fn=<MseLossBackward>)
output :  tensor([[254756.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0074e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133611.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1928583.1250, grad_fn=<MseLossBackward>)
output :  tensor([[202982.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(291.1289, grad_fn=<MseLossBackward>)
output :  tensor([[104699.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(40357.0430, grad_fn=<MseLossBackward>)
output :  tensor([[139378.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(327112.5000, grad_fn=<MseLossBackward>)
output :  tensor([[205161.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7399e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180750.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(722898.5000, grad_fn=<MseLossBackward>)
output :  tensor([[185606.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(367254.9375, grad_fn=<MseLossBackward>)
output :  tensor([[165665.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0545e+10, grad_fn=<MseLossBackward>)
output :  tensor([[294496.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6405e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199277.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1897721.5000, grad_fn=<MseLossBackward>)
output :  tensor([[260683.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0214e+10, grad_fn=<MseLossBackward>)
output :  tensor([[214686.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6331e+09, grad_fn=<MseLossBackward>)
output :  tensor([[271676.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0542e+09, grad_fn=<MseLossBackward>)
output :  tensor([[224645.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(417114.1562, grad_fn=<MseLossBackward>)
output :  tensor([[224998.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7889e+10, grad_fn=<MseLossBackward>)
output :  tensor([[199736.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7487833.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159094.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0568e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133201.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(492453.0625, grad_fn=<MseLossBackward>)
output :  tensor([[133900.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2557800.5000, grad_fn=<MseLossBackward>)
output :  tensor([[94480.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(12112738., grad_fn=<MseLossBackward>)
output :  tensor([[106899.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(1211805.3750, grad_fn=<MseLossBackward>)
output :  tensor([[273587.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0595e+09, grad_fn=<MseLossBackward>)
output :  tensor([[230913.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(16697822., grad_fn=<MseLossBackward>)
output :  tensor([[146370.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1878612.8750, grad_fn=<MseLossBackward>)
output :  tensor([[138544.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1090980.2500, grad_fn=<MseLossBackward>)
output :  tensor([[174074.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(116835.7812, grad_fn=<MseLossBackward>)
output :  tensor([[147968.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(7388288.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164005.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2990e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165042.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1818.2229, grad_fn=<MseLossBackward>)
output :  tensor([[138504.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2264460.7500, grad_fn=<MseLossBackward>)
output :  tensor([[189859.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5373e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113025.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(1051474., grad_fn=<MseLossBackward>)
output :  tensor([[169769.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4976524.5000, grad_fn=<MseLossBackward>)
output :  tensor([[119949.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(2543.1533, grad_fn=<MseLossBackward>)
output :  tensor([[84930.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(4282022., grad_fn=<MseLossBackward>)
output :  tensor([[179628.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(138349.1250, grad_fn=<MseLossBackward>)
output :  tensor([[112784.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8319979.5000, grad_fn=<MseLossBackward>)
output :  tensor([[239164.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(26993.4629, grad_fn=<MseLossBackward>)
output :  tensor([[246400.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1961269., grad_fn=<MseLossBackward>)
output :  tensor([[123283.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(38647204., grad_fn=<MseLossBackward>)
output :  tensor([[110834.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(3517764., grad_fn=<MseLossBackward>)
output :  tensor([[288335.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2147e+10, grad_fn=<MseLossBackward>)
output :  tensor([[167955.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(12566471., grad_fn=<MseLossBackward>)
output :  tensor([[124259.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(547877.5625, grad_fn=<MseLossBackward>)
output :  tensor([[146758.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2707e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199312.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1572e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140985.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(200.8420, grad_fn=<MseLossBackward>)
output :  tensor([[155244.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5564e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158518.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(21327656., grad_fn=<MseLossBackward>)
output :  tensor([[129835.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(112502.5938, grad_fn=<MseLossBackward>)
output :  tensor([[240923.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8927e+10, grad_fn=<MseLossBackward>)
output :  tensor([[400278.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2963992.7500, grad_fn=<MseLossBackward>)
output :  tensor([[107924.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1157271.6250, grad_fn=<MseLossBackward>)
output :  tensor([[111946.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(42950512., grad_fn=<MseLossBackward>)
output :  tensor([[160730.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1514707.1250, grad_fn=<MseLossBackward>)
output :  tensor([[131083.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2515e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162088.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5893e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173187.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9927e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103772.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(29624.3262, grad_fn=<MseLossBackward>)
output :  tensor([[139935.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1132594.7500, grad_fn=<MseLossBackward>)
output :  tensor([[364067.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(10408286., grad_fn=<MseLossBackward>)
output :  tensor([[197766.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1622e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172451.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(9296115., grad_fn=<MseLossBackward>)
output :  tensor([[202950.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2593.0374, grad_fn=<MseLossBackward>)
output :  tensor([[137956.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1088501., grad_fn=<MseLossBackward>)
output :  tensor([[193331.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1364662., grad_fn=<MseLossBackward>)
output :  tensor([[135711.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9589e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182777.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3161006.2500, grad_fn=<MseLossBackward>)
output :  tensor([[243243.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1546564.2500, grad_fn=<MseLossBackward>)
output :  tensor([[172278.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2965122.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110189.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(4795381.5000, grad_fn=<MseLossBackward>)
output :  tensor([[266607.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4188162.2500, grad_fn=<MseLossBackward>)
output :  tensor([[243830.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(38062924., grad_fn=<MseLossBackward>)
output :  tensor([[124428.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(2041527.5000, grad_fn=<MseLossBackward>)
output :  tensor([[213845.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7399e+09, grad_fn=<MseLossBackward>)
output :  tensor([[301730.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5554e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204244.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7593813.5000, grad_fn=<MseLossBackward>)
output :  tensor([[211847.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6423e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157715.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(34207.6602, grad_fn=<MseLossBackward>)
output :  tensor([[169558.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(186543.0156, grad_fn=<MseLossBackward>)
output :  tensor([[163085.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(37867100., grad_fn=<MseLossBackward>)
output :  tensor([[171797.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3231624.2500, grad_fn=<MseLossBackward>)
output :  tensor([[232145.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2855e+09, grad_fn=<MseLossBackward>)
output :  tensor([[208598.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3502e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160224.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7488e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129571.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(43189232., grad_fn=<MseLossBackward>)
output :  tensor([[174799.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4840687.5000, grad_fn=<MseLossBackward>)
output :  tensor([[181019.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2379e+09, grad_fn=<MseLossBackward>)
output :  tensor([[203823.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6402e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133908.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(274445., grad_fn=<MseLossBackward>)
output :  tensor([[150924.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5994e+08, grad_fn=<MseLossBackward>)
output :  tensor([[276901.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9794.8135, grad_fn=<MseLossBackward>)
output :  tensor([[85541.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(293120.7188, grad_fn=<MseLossBackward>)
output :  tensor([[235414.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1177733.6250, grad_fn=<MseLossBackward>)
output :  tensor([[258452.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0529e+11, grad_fn=<MseLossBackward>)
output :  tensor([[168280.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2957486.2500, grad_fn=<MseLossBackward>)
output :  tensor([[190294.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9986e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150578.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(19547314., grad_fn=<MseLossBackward>)
output :  tensor([[205153.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2051e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127058.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3769301., grad_fn=<MseLossBackward>)
output :  tensor([[148141.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(9871575., grad_fn=<MseLossBackward>)
output :  tensor([[172935.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2631e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185455.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(155654.9062, grad_fn=<MseLossBackward>)
output :  tensor([[127306.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(1707207.6250, grad_fn=<MseLossBackward>)
output :  tensor([[135772.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(528665.3125, grad_fn=<MseLossBackward>)
output :  tensor([[170678.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5389870., grad_fn=<MseLossBackward>)
output :  tensor([[198476.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6547e+09, grad_fn=<MseLossBackward>)
output :  tensor([[242616.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(146712.9375, grad_fn=<MseLossBackward>)
output :  tensor([[149315.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(32311586., grad_fn=<MseLossBackward>)
output :  tensor([[193104.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8383558.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165904.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7981e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177254.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5042551., grad_fn=<MseLossBackward>)
output :  tensor([[186420.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(42516512., grad_fn=<MseLossBackward>)
output :  tensor([[98112.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(1237847.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172635.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1527e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135033.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1120.1572, grad_fn=<MseLossBackward>)
output :  tensor([[123027.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(64439752., grad_fn=<MseLossBackward>)
output :  tensor([[175124.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1263973.2500, grad_fn=<MseLossBackward>)
output :  tensor([[87396.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5743886.5000, grad_fn=<MseLossBackward>)
output :  tensor([[285452.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(20677482., grad_fn=<MseLossBackward>)
output :  tensor([[171637.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(44054332., grad_fn=<MseLossBackward>)
output :  tensor([[191409.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0096e+10, grad_fn=<MseLossBackward>)
output :  tensor([[242163.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3157e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153014.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4056762.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123389.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(372509.9688, grad_fn=<MseLossBackward>)
output :  tensor([[122729.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(8007175.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145185.]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1113e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178924.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(24250546., grad_fn=<MseLossBackward>)
output :  tensor([[114944.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0527e+09, grad_fn=<MseLossBackward>)
output :  tensor([[207900.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2122e+10, grad_fn=<MseLossBackward>)
output :  tensor([[246745.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(27516910., grad_fn=<MseLossBackward>)
output :  tensor([[246772.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2028e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221847.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9421e+08, grad_fn=<MseLossBackward>)
output :  tensor([[192832.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5047e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188875.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1892215.1250, grad_fn=<MseLossBackward>)
output :  tensor([[206569.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7655e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186228.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2432e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177549.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1418108.8750, grad_fn=<MseLossBackward>)
output :  tensor([[152014.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(212.5217, grad_fn=<MseLossBackward>)
output :  tensor([[336401.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(358539., grad_fn=<MseLossBackward>)
output :  tensor([[213120.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1254435., grad_fn=<MseLossBackward>)
output :  tensor([[163012.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(9073368., grad_fn=<MseLossBackward>)
output :  tensor([[184375.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2632e+09, grad_fn=<MseLossBackward>)
output :  tensor([[104874.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(15724.7686, grad_fn=<MseLossBackward>)
output :  tensor([[270155.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1136e+10, grad_fn=<MseLossBackward>)
output :  tensor([[172113.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3191526.5000, grad_fn=<MseLossBackward>)
output :  tensor([[218305.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(23090878., grad_fn=<MseLossBackward>)
output :  tensor([[202636.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3721e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176489.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7347657.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200467.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1775098.2500, grad_fn=<MseLossBackward>)
output :  tensor([[150707.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(18426764., grad_fn=<MseLossBackward>)
output :  tensor([[150872.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5880e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119250.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(562734.3750, grad_fn=<MseLossBackward>)
output :  tensor([[141002.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1004849.6250, grad_fn=<MseLossBackward>)
output :  tensor([[148904.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(9102.3525, grad_fn=<MseLossBackward>)
output :  tensor([[199418.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6533e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161246.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3049389., grad_fn=<MseLossBackward>)
output :  tensor([[100949.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2102454.7500, grad_fn=<MseLossBackward>)
output :  tensor([[223561.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7022e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188770.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4151e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175783.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(492760.1250, grad_fn=<MseLossBackward>)
output :  tensor([[81949.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2558.1467, grad_fn=<MseLossBackward>)
output :  tensor([[128008.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(241242.1406, grad_fn=<MseLossBackward>)
output :  tensor([[218900.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(24011838., grad_fn=<MseLossBackward>)
output :  tensor([[143623.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(141834.6250, grad_fn=<MseLossBackward>)
output :  tensor([[133744.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(14021631., grad_fn=<MseLossBackward>)
output :  tensor([[145826.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(10411916., grad_fn=<MseLossBackward>)
output :  tensor([[179909.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7986e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143438.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(315054.1875, grad_fn=<MseLossBackward>)
output :  tensor([[158282.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2951470.2500, grad_fn=<MseLossBackward>)
output :  tensor([[213261.]], grad_fn=<AddmmBackward>)
loss:  tensor(3024121., grad_fn=<MseLossBackward>)
output :  tensor([[137602.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0629e+09, grad_fn=<MseLossBackward>)
output :  tensor([[257576.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6636581., grad_fn=<MseLossBackward>)
output :  tensor([[156925.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6627728.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128403.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9396.8789, grad_fn=<MseLossBackward>)
output :  tensor([[93745.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(1573397.8750, grad_fn=<MseLossBackward>)
output :  tensor([[154424.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8894e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183336.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(11807492., grad_fn=<MseLossBackward>)
output :  tensor([[119982.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(267992.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188041.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6735e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146764.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5245e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151053.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1331643.8750, grad_fn=<MseLossBackward>)
output :  tensor([[189087.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1788154., grad_fn=<MseLossBackward>)
output :  tensor([[253158.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5935e+09, grad_fn=<MseLossBackward>)
output :  tensor([[93985.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6176234.5000, grad_fn=<MseLossBackward>)
output :  tensor([[237496.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6269155.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129930.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(2047380.8750, grad_fn=<MseLossBackward>)
output :  tensor([[167161.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7492e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115322.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3479e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175580.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(175574.0938, grad_fn=<MseLossBackward>)
output :  tensor([[166394.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2871e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155772.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3868e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236075.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(8550416., grad_fn=<MseLossBackward>)
output :  tensor([[225142.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0796e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129453.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(6018474., grad_fn=<MseLossBackward>)
output :  tensor([[122540.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(11965708., grad_fn=<MseLossBackward>)
output :  tensor([[224396.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6777724., grad_fn=<MseLossBackward>)
output :  tensor([[228752.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(27536092., grad_fn=<MseLossBackward>)
output :  tensor([[230785.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(16692076., grad_fn=<MseLossBackward>)
output :  tensor([[147841.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(25156.9336, grad_fn=<MseLossBackward>)
output :  tensor([[211202.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1445329.8750, grad_fn=<MseLossBackward>)
output :  tensor([[132197.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4877e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132887.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(149902.0625, grad_fn=<MseLossBackward>)
output :  tensor([[305076.]], grad_fn=<AddmmBackward>)
loss:  tensor(98485776., grad_fn=<MseLossBackward>)
output :  tensor([[138608.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5718450., grad_fn=<MseLossBackward>)
output :  tensor([[120671.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8806e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110220.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(518433.7500, grad_fn=<MseLossBackward>)
output :  tensor([[155362.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9370e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178391.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2801e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175824.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7979389., grad_fn=<MseLossBackward>)
output :  tensor([[190877.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0247e+08, grad_fn=<MseLossBackward>)
output :  tensor([[106201.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(38464124., grad_fn=<MseLossBackward>)
output :  tensor([[176848.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4631037., grad_fn=<MseLossBackward>)
output :  tensor([[169586.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2843386.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138932.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4514.1602, grad_fn=<MseLossBackward>)
output :  tensor([[254083.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1029e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143267.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3951e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176786.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(14339949., grad_fn=<MseLossBackward>)
output :  tensor([[143865.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(14940399., grad_fn=<MseLossBackward>)
output :  tensor([[198240.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5104987., grad_fn=<MseLossBackward>)
output :  tensor([[167978.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4087978.5000, grad_fn=<MseLossBackward>)
output :  tensor([[243877.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(14922.1494, grad_fn=<MseLossBackward>)
output :  tensor([[133789.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(505387.6875, grad_fn=<MseLossBackward>)
output :  tensor([[151498.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4616388., grad_fn=<MseLossBackward>)
output :  tensor([[213957.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1087653.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165691.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(477610.5625, grad_fn=<MseLossBackward>)
output :  tensor([[192618.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(13090263., grad_fn=<MseLossBackward>)
output :  tensor([[135034.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7437e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129911.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(831701.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139950.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2437.8906, grad_fn=<MseLossBackward>)
output :  tensor([[199075.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9597e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164949.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4949e+09, grad_fn=<MseLossBackward>)
output :  tensor([[79200.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6867e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92607.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(65738904., grad_fn=<MseLossBackward>)
output :  tensor([[252640.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(426225.3750, grad_fn=<MseLossBackward>)
output :  tensor([[203768.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1949e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114084.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(838955.8125, grad_fn=<MseLossBackward>)
output :  tensor([[158808.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2318e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204036.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5482e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178157.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4351e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157109.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4451111., grad_fn=<MseLossBackward>)
output :  tensor([[171474.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2174611., grad_fn=<MseLossBackward>)
output :  tensor([[114024.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(952316.7500, grad_fn=<MseLossBackward>)
output :  tensor([[163647.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(74770880., grad_fn=<MseLossBackward>)
output :  tensor([[193588.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7719e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220862.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1857257.8750, grad_fn=<MseLossBackward>)
output :  tensor([[243297.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5171e+11, grad_fn=<MseLossBackward>)
output :  tensor([[148481.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2194379.2500, grad_fn=<MseLossBackward>)
output :  tensor([[110151.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2793233.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170060.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4018e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150379.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(14448.7910, grad_fn=<MseLossBackward>)
output :  tensor([[236866.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(17826.4219, grad_fn=<MseLossBackward>)
output :  tensor([[117766.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7652485., grad_fn=<MseLossBackward>)
output :  tensor([[177916.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(24835740., grad_fn=<MseLossBackward>)
output :  tensor([[186636.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4032.2500, grad_fn=<MseLossBackward>)
output :  tensor([[165301.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3932e+10, grad_fn=<MseLossBackward>)
output :  tensor([[99568.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4480e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239850.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(724174.4375, grad_fn=<MseLossBackward>)
output :  tensor([[177388.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1927411.6250, grad_fn=<MseLossBackward>)
output :  tensor([[141148.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1319375.2500, grad_fn=<MseLossBackward>)
output :  tensor([[235234.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(54792.5703, grad_fn=<MseLossBackward>)
output :  tensor([[164354.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1835940.3750, grad_fn=<MseLossBackward>)
output :  tensor([[200242.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5564e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136780.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3171126.2500, grad_fn=<MseLossBackward>)
output :  tensor([[185619.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5788e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136811.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(659217.1250, grad_fn=<MseLossBackward>)
output :  tensor([[224243.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3822e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223452.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0475e+08, grad_fn=<MseLossBackward>)
output :  tensor([[89902.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(9547.4277, grad_fn=<MseLossBackward>)
output :  tensor([[161653.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4928192., grad_fn=<MseLossBackward>)
output :  tensor([[244919.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5866e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145051.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2615.3635, grad_fn=<MseLossBackward>)
output :  tensor([[106992.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5994e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164977.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(228439.1875, grad_fn=<MseLossBackward>)
output :  tensor([[146048.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4198337., grad_fn=<MseLossBackward>)
output :  tensor([[127823.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(141399.5000, grad_fn=<MseLossBackward>)
output :  tensor([[190254.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7259e+09, grad_fn=<MseLossBackward>)
output :  tensor([[121396.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1217574.3750, grad_fn=<MseLossBackward>)
output :  tensor([[152250.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(62969.6289, grad_fn=<MseLossBackward>)
output :  tensor([[168568.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(10122439., grad_fn=<MseLossBackward>)
output :  tensor([[151626.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(392541.4062, grad_fn=<MseLossBackward>)
output :  tensor([[159659.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(10499828., grad_fn=<MseLossBackward>)
output :  tensor([[135602.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0770e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131695.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(92882.0859, grad_fn=<MseLossBackward>)
output :  tensor([[154725.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4730e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144173.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(462.2500, grad_fn=<MseLossBackward>)
output :  tensor([[160125.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2637883.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139338.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6660e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146916.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3547454.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183362.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(21504378., grad_fn=<MseLossBackward>)
output :  tensor([[169956.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(914473.8125, grad_fn=<MseLossBackward>)
output :  tensor([[181411.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1992994., grad_fn=<MseLossBackward>)
output :  tensor([[217356.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6987018.5000, grad_fn=<MseLossBackward>)
output :  tensor([[114060.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(37954648., grad_fn=<MseLossBackward>)
output :  tensor([[141035.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6035e+08, grad_fn=<MseLossBackward>)
output :  tensor([[286988.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(977008.6875, grad_fn=<MseLossBackward>)
output :  tensor([[117396.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1949514., grad_fn=<MseLossBackward>)
output :  tensor([[172090.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2953e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181372.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(13158076., grad_fn=<MseLossBackward>)
output :  tensor([[186383.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(781069.3125, grad_fn=<MseLossBackward>)
output :  tensor([[250268.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1165e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222726.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(527484.4375, grad_fn=<MseLossBackward>)
output :  tensor([[132142.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8869e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176325.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4409e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126785.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7759010., grad_fn=<MseLossBackward>)
output :  tensor([[181641.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6120e+10, grad_fn=<MseLossBackward>)
output :  tensor([[155871.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8244615., grad_fn=<MseLossBackward>)
output :  tensor([[155503.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(81056544., grad_fn=<MseLossBackward>)
output :  tensor([[204882.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2007933.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143696.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2536e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174691.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1711272.7500, grad_fn=<MseLossBackward>)
output :  tensor([[249637.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9174e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149318.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1738771.8750, grad_fn=<MseLossBackward>)
output :  tensor([[200571.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4381761., grad_fn=<MseLossBackward>)
output :  tensor([[162983.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(9202501., grad_fn=<MseLossBackward>)
output :  tensor([[128370.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6298e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136941.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1419635., grad_fn=<MseLossBackward>)
output :  tensor([[182245.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3078270.2500, grad_fn=<MseLossBackward>)
output :  tensor([[194991.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(24916476., grad_fn=<MseLossBackward>)
output :  tensor([[220634.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6739e+09, grad_fn=<MseLossBackward>)
output :  tensor([[250400.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(43557524., grad_fn=<MseLossBackward>)
output :  tensor([[179979.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9327e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146037.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9743e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147195.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(7264962., grad_fn=<MseLossBackward>)
output :  tensor([[74293.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1760e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142678.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(58962000., grad_fn=<MseLossBackward>)
output :  tensor([[132828.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(15436182., grad_fn=<MseLossBackward>)
output :  tensor([[155776.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3157284.7500, grad_fn=<MseLossBackward>)
output :  tensor([[126563.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(190791.5156, grad_fn=<MseLossBackward>)
output :  tensor([[79159.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7071693.5000, grad_fn=<MseLossBackward>)
output :  tensor([[84028.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(4113956.5000, grad_fn=<MseLossBackward>)
output :  tensor([[229180.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7947377.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140650.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9246e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136957.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(41699708., grad_fn=<MseLossBackward>)
output :  tensor([[166647.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(124047.0391, grad_fn=<MseLossBackward>)
output :  tensor([[238155.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(9956391., grad_fn=<MseLossBackward>)
output :  tensor([[190679.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2132695.2500, grad_fn=<MseLossBackward>)
output :  tensor([[152556.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(11860060., grad_fn=<MseLossBackward>)
output :  tensor([[195883.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4064508., grad_fn=<MseLossBackward>)
output :  tensor([[198536.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4795e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138708.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2920520.7500, grad_fn=<MseLossBackward>)
output :  tensor([[154919.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6450.0977, grad_fn=<MseLossBackward>)
output :  tensor([[135948.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2678.0625, grad_fn=<MseLossBackward>)
output :  tensor([[197019.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0877e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153769.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(53288.8359, grad_fn=<MseLossBackward>)
output :  tensor([[138140.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9927e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145245.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(119478.2422, grad_fn=<MseLossBackward>)
output :  tensor([[205326.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(44532264., grad_fn=<MseLossBackward>)
output :  tensor([[108057.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7898e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166302.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1434717.3750, grad_fn=<MseLossBackward>)
output :  tensor([[125745.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(5081678.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147758.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(575583., grad_fn=<MseLossBackward>)
output :  tensor([[103505.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6911e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138780.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1639280.1250, grad_fn=<MseLossBackward>)
output :  tensor([[229509.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(42131460., grad_fn=<MseLossBackward>)
output :  tensor([[146296.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1680021., grad_fn=<MseLossBackward>)
output :  tensor([[141520.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(16163164., grad_fn=<MseLossBackward>)
output :  tensor([[166449.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4784e+09, grad_fn=<MseLossBackward>)
output :  tensor([[263842.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0045e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176841.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3390489.2500, grad_fn=<MseLossBackward>)
output :  tensor([[103059.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(80527.3672, grad_fn=<MseLossBackward>)
output :  tensor([[199812.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0354e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167278.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(68538736., grad_fn=<MseLossBackward>)
output :  tensor([[161514.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6618e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97352.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(898067.1875, grad_fn=<MseLossBackward>)
output :  tensor([[123371.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(52126.5977, grad_fn=<MseLossBackward>)
output :  tensor([[155874.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(15667.9980, grad_fn=<MseLossBackward>)
output :  tensor([[140705.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(498325.6875, grad_fn=<MseLossBackward>)
output :  tensor([[201794.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3219333., grad_fn=<MseLossBackward>)
output :  tensor([[138888.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(9683474., grad_fn=<MseLossBackward>)
output :  tensor([[264581.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5298916.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130928.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4386e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163239.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5111273., grad_fn=<MseLossBackward>)
output :  tensor([[188565.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4312.7949, grad_fn=<MseLossBackward>)
output :  tensor([[125474.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3945e+08, grad_fn=<MseLossBackward>)
output :  tensor([[249926.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5379.3057, grad_fn=<MseLossBackward>)
output :  tensor([[156740.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1566e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244074.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1627179.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144299.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(89700.2500, grad_fn=<MseLossBackward>)
output :  tensor([[210984.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(969024.8750, grad_fn=<MseLossBackward>)
output :  tensor([[178263.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(34380084., grad_fn=<MseLossBackward>)
output :  tensor([[154847.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(718123.8125, grad_fn=<MseLossBackward>)
output :  tensor([[118901.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(812927.6250, grad_fn=<MseLossBackward>)
output :  tensor([[236256.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5841e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236559.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(11836610., grad_fn=<MseLossBackward>)
output :  tensor([[151294.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4172955.2500, grad_fn=<MseLossBackward>)
output :  tensor([[252252.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(7008263.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121919.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(54985584., grad_fn=<MseLossBackward>)
output :  tensor([[176519.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(269393.4375, grad_fn=<MseLossBackward>)
output :  tensor([[161067.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1138822.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130938.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(3746.7788, grad_fn=<MseLossBackward>)
output :  tensor([[197311.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5984e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165688.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2850188., grad_fn=<MseLossBackward>)
output :  tensor([[167537.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(20587914., grad_fn=<MseLossBackward>)
output :  tensor([[157568.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(186570., grad_fn=<MseLossBackward>)
output :  tensor([[154285.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(19234804., grad_fn=<MseLossBackward>)
output :  tensor([[178013.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6942e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157652.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5508555.5000, grad_fn=<MseLossBackward>)
output :  tensor([[371707.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5036e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133476.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(41947480., grad_fn=<MseLossBackward>)
output :  tensor([[130568.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0312e+09, grad_fn=<MseLossBackward>)
output :  tensor([[278221.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8949446., grad_fn=<MseLossBackward>)
output :  tensor([[164149.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4619477., grad_fn=<MseLossBackward>)
output :  tensor([[131600.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2322e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237361.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(28750206., grad_fn=<MseLossBackward>)
output :  tensor([[180904.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(163253.8750, grad_fn=<MseLossBackward>)
output :  tensor([[152877.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(770801.6875, grad_fn=<MseLossBackward>)
output :  tensor([[145476.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(226709.8906, grad_fn=<MseLossBackward>)
output :  tensor([[157955.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4334e+08, grad_fn=<MseLossBackward>)
output :  tensor([[102926.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(8566734., grad_fn=<MseLossBackward>)
output :  tensor([[79881.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9529e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166993.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3974789.7500, grad_fn=<MseLossBackward>)
output :  tensor([[187584.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6334e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159242.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1542835.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161303.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(14469703., grad_fn=<MseLossBackward>)
output :  tensor([[137539.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7982.3057, grad_fn=<MseLossBackward>)
output :  tensor([[208434.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(6170877., grad_fn=<MseLossBackward>)
output :  tensor([[138142.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(20408.8008, grad_fn=<MseLossBackward>)
output :  tensor([[181014.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6637e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141362.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(21507856., grad_fn=<MseLossBackward>)
output :  tensor([[111800.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2948e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93858.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(20119.6484, grad_fn=<MseLossBackward>)
output :  tensor([[175204.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(41967.3633, grad_fn=<MseLossBackward>)
output :  tensor([[266475.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(36906764., grad_fn=<MseLossBackward>)
output :  tensor([[141871.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(138000.6406, grad_fn=<MseLossBackward>)
output :  tensor([[158176.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2953940.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134014.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2294515., grad_fn=<MseLossBackward>)
output :  tensor([[145606.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(15158491., grad_fn=<MseLossBackward>)
output :  tensor([[167895.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(22.4143, grad_fn=<MseLossBackward>)
output :  tensor([[127637.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(406276.7812, grad_fn=<MseLossBackward>)
output :  tensor([[175774.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4708e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158092.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1192737., grad_fn=<MseLossBackward>)
output :  tensor([[116423.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5883.3691, grad_fn=<MseLossBackward>)
output :  tensor([[159895.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3443e+09, grad_fn=<MseLossBackward>)
output :  tensor([[58456.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(41689620., grad_fn=<MseLossBackward>)
output :  tensor([[229392.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9069e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201964.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(930200., grad_fn=<MseLossBackward>)
output :  tensor([[182344.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7049440., grad_fn=<MseLossBackward>)
output :  tensor([[107083.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(1172939.7500, grad_fn=<MseLossBackward>)
output :  tensor([[89007.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4028174.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137579.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(5859425.5000, grad_fn=<MseLossBackward>)
output :  tensor([[216433.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0165e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200315.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(51619736., grad_fn=<MseLossBackward>)
output :  tensor([[164730.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(72883.1250, grad_fn=<MseLossBackward>)
output :  tensor([[170987.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8384e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190561.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(315282.2500, grad_fn=<MseLossBackward>)
output :  tensor([[87974.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(950030.9375, grad_fn=<MseLossBackward>)
output :  tensor([[138421.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2491563.5000, grad_fn=<MseLossBackward>)
output :  tensor([[113423.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(8544294., grad_fn=<MseLossBackward>)
output :  tensor([[147627.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3614e+08, grad_fn=<MseLossBackward>)
output :  tensor([[170473.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5582e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191223.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8980e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180147.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(21618.1875, grad_fn=<MseLossBackward>)
output :  tensor([[96886.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(149002.0312, grad_fn=<MseLossBackward>)
output :  tensor([[115971.]], grad_fn=<AddmmBackward>)
loss:  tensor(2337841., grad_fn=<MseLossBackward>)
output :  tensor([[159119.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1903e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196852.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(9907642., grad_fn=<MseLossBackward>)
output :  tensor([[145370.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1879341.1250, grad_fn=<MseLossBackward>)
train_loss: [2.6743222e+09]
epoch_result tensor([0.])
output :  tensor([[156762.]], grad_fn=<AddmmBackward>)
loss:  tensor(3020644., grad_fn=<MseLossBackward>)
output :  tensor([[119898.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(4415875.5000, grad_fn=<MseLossBackward>)
output :  tensor([[196206.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4021591.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176637.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(131259.0312, grad_fn=<MseLossBackward>)
output :  tensor([[154215.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6568e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131810.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(14521696., grad_fn=<MseLossBackward>)
output :  tensor([[139171.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3344898., grad_fn=<MseLossBackward>)
output :  tensor([[115486.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(12344133., grad_fn=<MseLossBackward>)
output :  tensor([[72679.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0106e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166015.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(233.9944, grad_fn=<MseLossBackward>)
output :  tensor([[142873.]], grad_fn=<AddmmBackward>)
loss:  tensor(8254129., grad_fn=<MseLossBackward>)
output :  tensor([[225219.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(48290.0625, grad_fn=<MseLossBackward>)
output :  tensor([[167324.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2805834.5000, grad_fn=<MseLossBackward>)
output :  tensor([[246767.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(8599648., grad_fn=<MseLossBackward>)
output :  tensor([[53442.3711]], grad_fn=<AddmmBackward>)
loss:  tensor(2426207.7500, grad_fn=<MseLossBackward>)
output :  tensor([[163171.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4864e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183205.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(67324592., grad_fn=<MseLossBackward>)
output :  tensor([[159776.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(10738115., grad_fn=<MseLossBackward>)
output :  tensor([[274387.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(374964.8750, grad_fn=<MseLossBackward>)
output :  tensor([[197941.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(885863.3125, grad_fn=<MseLossBackward>)
output :  tensor([[135868.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6525e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195462.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2508907.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175943.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3967e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151585.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(343341.0625, grad_fn=<MseLossBackward>)
output :  tensor([[166856.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9880413., grad_fn=<MseLossBackward>)
output :  tensor([[87262.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(3470157.7500, grad_fn=<MseLossBackward>)
output :  tensor([[166450.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8570e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183032.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3870257., grad_fn=<MseLossBackward>)
output :  tensor([[202888.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7680e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107781.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(4921361., grad_fn=<MseLossBackward>)
output :  tensor([[171677.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(458815.7188, grad_fn=<MseLossBackward>)
output :  tensor([[137658.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1342774., grad_fn=<MseLossBackward>)
output :  tensor([[129458.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(210172.1094, grad_fn=<MseLossBackward>)
output :  tensor([[120382.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(779564.8125, grad_fn=<MseLossBackward>)
output :  tensor([[145497.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1213e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167860.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1650e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149297.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(162106.8906, grad_fn=<MseLossBackward>)
output :  tensor([[180964.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(930712.4375, grad_fn=<MseLossBackward>)
output :  tensor([[144641.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(13261888., grad_fn=<MseLossBackward>)
output :  tensor([[106897.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8552e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133339.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6684e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129439.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(30920290., grad_fn=<MseLossBackward>)
output :  tensor([[142752.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4816e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227834.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(8035364.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132313.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4068.0479, grad_fn=<MseLossBackward>)
output :  tensor([[149173.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(30227.0820, grad_fn=<MseLossBackward>)
output :  tensor([[113614.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2607215.7500, grad_fn=<MseLossBackward>)
output :  tensor([[158615.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1917099.8750, grad_fn=<MseLossBackward>)
output :  tensor([[144649.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5351e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191847.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(23265.7812, grad_fn=<MseLossBackward>)
output :  tensor([[132179.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5154815.5000, grad_fn=<MseLossBackward>)
output :  tensor([[115655.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(31988568., grad_fn=<MseLossBackward>)
output :  tensor([[231257.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(7523106., grad_fn=<MseLossBackward>)
output :  tensor([[161822.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6695e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162276.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(10736681., grad_fn=<MseLossBackward>)
output :  tensor([[203505.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8559e+10, grad_fn=<MseLossBackward>)
output :  tensor([[244445.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2002e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146231.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7458702.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135873.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3508948.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154896.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(10764.0625, grad_fn=<MseLossBackward>)
output :  tensor([[130960.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(923445.9375, grad_fn=<MseLossBackward>)
output :  tensor([[179606.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4631e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181018.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(9492657., grad_fn=<MseLossBackward>)
output :  tensor([[165287.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(14344683., grad_fn=<MseLossBackward>)
output :  tensor([[152816.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(96355392., grad_fn=<MseLossBackward>)
output :  tensor([[142466.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1121.2034, grad_fn=<MseLossBackward>)
output :  tensor([[147274.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5175198.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169752.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8906e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190061.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2568e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139193.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7256541.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168488.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(11635028., grad_fn=<MseLossBackward>)
output :  tensor([[173511.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(56084888., grad_fn=<MseLossBackward>)
output :  tensor([[115191.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(36588.5156, grad_fn=<MseLossBackward>)
output :  tensor([[215460.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(30688830., grad_fn=<MseLossBackward>)
output :  tensor([[182378.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1258428.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123221.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5189355., grad_fn=<MseLossBackward>)
output :  tensor([[195765.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(538870.6875, grad_fn=<MseLossBackward>)
output :  tensor([[175651.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(565410., grad_fn=<MseLossBackward>)
output :  tensor([[205857.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2541e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209104.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3593808.7500, grad_fn=<MseLossBackward>)
output :  tensor([[166807.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2822e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193513.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(972966.4375, grad_fn=<MseLossBackward>)
output :  tensor([[111678.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1746321., grad_fn=<MseLossBackward>)
output :  tensor([[114064.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(2448124.7500, grad_fn=<MseLossBackward>)
output :  tensor([[111697.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(91553.5234, grad_fn=<MseLossBackward>)
output :  tensor([[145556.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1545903.6250, grad_fn=<MseLossBackward>)
output :  tensor([[159266.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3627e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177331.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(7121559.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129384.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3552636., grad_fn=<MseLossBackward>)
output :  tensor([[143288.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2930676.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183740.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3854e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119302.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(5773620.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198707.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2916677., grad_fn=<MseLossBackward>)
output :  tensor([[149034.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(16280595., grad_fn=<MseLossBackward>)
output :  tensor([[209185.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(13795073., grad_fn=<MseLossBackward>)
output :  tensor([[126458.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(210365.5625, grad_fn=<MseLossBackward>)
output :  tensor([[250725.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(5747407., grad_fn=<MseLossBackward>)
output :  tensor([[234075.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5933e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152782.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5720e+08, grad_fn=<MseLossBackward>)
output :  tensor([[83969.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2760e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188121.]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5306e+09, grad_fn=<MseLossBackward>)
output :  tensor([[81399.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(159369.3750, grad_fn=<MseLossBackward>)
output :  tensor([[138907.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(351611.9375, grad_fn=<MseLossBackward>)
output :  tensor([[76225.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(526837.8125, grad_fn=<MseLossBackward>)
output :  tensor([[144480.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2334163.2500, grad_fn=<MseLossBackward>)
output :  tensor([[174270.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2990413.7500, grad_fn=<MseLossBackward>)
output :  tensor([[151665.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3366651.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109324.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(3703910.7500, grad_fn=<MseLossBackward>)
output :  tensor([[203229.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2661e+10, grad_fn=<MseLossBackward>)
output :  tensor([[128970.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(221818.9219, grad_fn=<MseLossBackward>)
output :  tensor([[267594.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5390e+08, grad_fn=<MseLossBackward>)
output :  tensor([[293679.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6637e+08, grad_fn=<MseLossBackward>)
output :  tensor([[108319.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(671337., grad_fn=<MseLossBackward>)
output :  tensor([[170889.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2593710.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132010.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7649e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136921.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4320292., grad_fn=<MseLossBackward>)
output :  tensor([[132190.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3767056.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123877.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1260883.3750, grad_fn=<MseLossBackward>)
output :  tensor([[136147.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1011e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223763.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9695e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187781.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3476e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143701.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(39222.5664, grad_fn=<MseLossBackward>)
output :  tensor([[129348.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3416432.5000, grad_fn=<MseLossBackward>)
output :  tensor([[112576.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1759851., grad_fn=<MseLossBackward>)
output :  tensor([[251017.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4948e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136547.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2393692.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202238.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(579882.2500, grad_fn=<MseLossBackward>)
output :  tensor([[108348.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(11894308., grad_fn=<MseLossBackward>)
output :  tensor([[139220.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(531851.1250, grad_fn=<MseLossBackward>)
output :  tensor([[203046.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6027e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181299.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1959037.6250, grad_fn=<MseLossBackward>)
output :  tensor([[184142.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(735869.0625, grad_fn=<MseLossBackward>)
output :  tensor([[162916.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1340e+10, grad_fn=<MseLossBackward>)
output :  tensor([[297558.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4019e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197543.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(127003.1406, grad_fn=<MseLossBackward>)
output :  tensor([[257193.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1219e+10, grad_fn=<MseLossBackward>)
output :  tensor([[215560.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5441e+09, grad_fn=<MseLossBackward>)
output :  tensor([[274004.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8486e+09, grad_fn=<MseLossBackward>)
output :  tensor([[225224.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1500242.2500, grad_fn=<MseLossBackward>)
output :  tensor([[220608.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9375e+10, grad_fn=<MseLossBackward>)
output :  tensor([[200835.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(14711540., grad_fn=<MseLossBackward>)
output :  tensor([[158835.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9017e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129638.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(8185991.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136728.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1509020.2500, grad_fn=<MseLossBackward>)
output :  tensor([[92905.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3630334.7500, grad_fn=<MseLossBackward>)
output :  tensor([[108098.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(9759.2793, grad_fn=<MseLossBackward>)
output :  tensor([[267554.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7633e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237697.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7278276.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145706.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(499407.2188, grad_fn=<MseLossBackward>)
output :  tensor([[138809.]], grad_fn=<AddmmBackward>)
loss:  tensor(1713481., grad_fn=<MseLossBackward>)
output :  tensor([[171891.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3391985.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147572.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5391901.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162617.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0165e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165066.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4370.4492, grad_fn=<MseLossBackward>)
output :  tensor([[134962.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4151979.2500, grad_fn=<MseLossBackward>)
output :  tensor([[190571.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6337e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111847.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(23368.3770, grad_fn=<MseLossBackward>)
output :  tensor([[178099.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(37198752., grad_fn=<MseLossBackward>)
output :  tensor([[120927.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(859720.1250, grad_fn=<MseLossBackward>)
output :  tensor([[89194.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(4815179., grad_fn=<MseLossBackward>)
output :  tensor([[177808.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4800755., grad_fn=<MseLossBackward>)
output :  tensor([[111830.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(3725774.5000, grad_fn=<MseLossBackward>)
output :  tensor([[235099.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(15210609., grad_fn=<MseLossBackward>)
output :  tensor([[242847.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4631507.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129718.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(47602.3750, grad_fn=<MseLossBackward>)
output :  tensor([[110265.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(1708106., grad_fn=<MseLossBackward>)
output :  tensor([[285389.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3032e+10, grad_fn=<MseLossBackward>)
output :  tensor([[173382.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3545571.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128137.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(9844642., grad_fn=<MseLossBackward>)
output :  tensor([[145603.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6198e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199475.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1098e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141469.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(220356.8906, grad_fn=<MseLossBackward>)
output :  tensor([[156607.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5226e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149648.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(18079106., grad_fn=<MseLossBackward>)
output :  tensor([[132065.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6582191., grad_fn=<MseLossBackward>)
output :  tensor([[243584.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8202e+10, grad_fn=<MseLossBackward>)
output :  tensor([[405341.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(11162490., grad_fn=<MseLossBackward>)
output :  tensor([[109005.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(30.8546, grad_fn=<MseLossBackward>)
output :  tensor([[116888.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2598090.7500, grad_fn=<MseLossBackward>)
output :  tensor([[156257.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(10516137., grad_fn=<MseLossBackward>)
output :  tensor([[133568.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1746e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160774.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7486e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174831.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2032e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105164.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2448051.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142043.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1089283.6250, grad_fn=<MseLossBackward>)
output :  tensor([[363235.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(16473959., grad_fn=<MseLossBackward>)
output :  tensor([[199482.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9721e+09, grad_fn=<MseLossBackward>)
output :  tensor([[177283.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3180092., grad_fn=<MseLossBackward>)
output :  tensor([[200549.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5526686.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139884.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(782672., grad_fn=<MseLossBackward>)
output :  tensor([[192970.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2339991.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135912.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0725e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175547.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(29729586., grad_fn=<MseLossBackward>)
output :  tensor([[237875.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(17013304., grad_fn=<MseLossBackward>)
output :  tensor([[175112.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1236856.7500, grad_fn=<MseLossBackward>)
output :  tensor([[109689.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2853565.5000, grad_fn=<MseLossBackward>)
output :  tensor([[263049.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2283215.5000, grad_fn=<MseLossBackward>)
output :  tensor([[248215.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3185890.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123883.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(780489.4375, grad_fn=<MseLossBackward>)
output :  tensor([[211768.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9982e+09, grad_fn=<MseLossBackward>)
output :  tensor([[300420.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1900e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206413.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(343414.3125, grad_fn=<MseLossBackward>)
output :  tensor([[214370.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5783e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160643.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(7525335., grad_fn=<MseLossBackward>)
output :  tensor([[169588.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(161051.7188, grad_fn=<MseLossBackward>)
output :  tensor([[161754.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(23259822., grad_fn=<MseLossBackward>)
output :  tensor([[166750.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(10556813., grad_fn=<MseLossBackward>)
output :  tensor([[233226.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2092e+09, grad_fn=<MseLossBackward>)
output :  tensor([[214069.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3675e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161717.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1660e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125525.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6378466., grad_fn=<MseLossBackward>)
output :  tensor([[177312.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(97773.4688, grad_fn=<MseLossBackward>)
output :  tensor([[178145.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7001e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201721.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7209e+10, grad_fn=<MseLossBackward>)
output :  tensor([[137154.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(7412602., grad_fn=<MseLossBackward>)
output :  tensor([[155150.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1256e+09, grad_fn=<MseLossBackward>)
output :  tensor([[278838.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3380542., grad_fn=<MseLossBackward>)
output :  tensor([[86661.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(2760192.7500, grad_fn=<MseLossBackward>)
output :  tensor([[237683.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1401412., grad_fn=<MseLossBackward>)
output :  tensor([[254475.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0788e+11, grad_fn=<MseLossBackward>)
output :  tensor([[170196.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(38772.0703, grad_fn=<MseLossBackward>)
output :  tensor([[190996.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9363e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155512.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(262896.5312, grad_fn=<MseLossBackward>)
output :  tensor([[205960.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1010e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128404.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(354601.6562, grad_fn=<MseLossBackward>)
output :  tensor([[144734.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(70540.0391, grad_fn=<MseLossBackward>)
output :  tensor([[169603.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3460e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187067.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1481849.7500, grad_fn=<MseLossBackward>)
output :  tensor([[125249.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(562687.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136941.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(195018.8438, grad_fn=<MseLossBackward>)
output :  tensor([[174736.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3017114.7500, grad_fn=<MseLossBackward>)
output :  tensor([[196180.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8966e+09, grad_fn=<MseLossBackward>)
output :  tensor([[243354.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(125592.7188, grad_fn=<MseLossBackward>)
output :  tensor([[150595.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(19399758., grad_fn=<MseLossBackward>)
output :  tensor([[199834.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(14701473., grad_fn=<MseLossBackward>)
output :  tensor([[165241.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5120e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194604.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2816e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177633.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5137659.5000, grad_fn=<MseLossBackward>)
output :  tensor([[97312.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(97876.1016, grad_fn=<MseLossBackward>)
output :  tensor([[171621.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1746e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132877.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4503945., grad_fn=<MseLossBackward>)
output :  tensor([[121574.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(43219632., grad_fn=<MseLossBackward>)
output :  tensor([[171682.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5370444., grad_fn=<MseLossBackward>)
output :  tensor([[85595.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(355141.5000, grad_fn=<MseLossBackward>)
output :  tensor([[292247.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5050835., grad_fn=<MseLossBackward>)
output :  tensor([[166079.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1164409.6250, grad_fn=<MseLossBackward>)
output :  tensor([[192514.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9784e+10, grad_fn=<MseLossBackward>)
output :  tensor([[239844.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7069e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151326.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(106357.5156, grad_fn=<MseLossBackward>)
output :  tensor([[123121.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(771679.8750, grad_fn=<MseLossBackward>)
output :  tensor([[117163.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(7489244.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147531.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0583e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176961.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(8771963., grad_fn=<MseLossBackward>)
output :  tensor([[112558.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0349e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203873.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3025e+10, grad_fn=<MseLossBackward>)
output :  tensor([[229904.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3446e+08, grad_fn=<MseLossBackward>)
output :  tensor([[248315.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1573e+10, grad_fn=<MseLossBackward>)
output :  tensor([[218826.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0697e+08, grad_fn=<MseLossBackward>)
output :  tensor([[192713.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5077e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188291.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(626200.1875, grad_fn=<MseLossBackward>)
output :  tensor([[205271.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8224e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186984.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2206e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178370.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(136819.0781, grad_fn=<MseLossBackward>)
output :  tensor([[149371.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6908108.5000, grad_fn=<MseLossBackward>)
output :  tensor([[329581.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(55030432., grad_fn=<MseLossBackward>)
output :  tensor([[209192.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(7882846., grad_fn=<MseLossBackward>)
output :  tensor([[153946.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(36644864., grad_fn=<MseLossBackward>)
output :  tensor([[184084.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2966e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108990.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(15926709., grad_fn=<MseLossBackward>)
output :  tensor([[268486.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2090e+10, grad_fn=<MseLossBackward>)
output :  tensor([[169732.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(17365060., grad_fn=<MseLossBackward>)
output :  tensor([[216975.]], grad_fn=<AddmmBackward>)
loss:  tensor(12075625., grad_fn=<MseLossBackward>)
output :  tensor([[201046.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9815e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181027.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3339756.2500, grad_fn=<MseLossBackward>)
output :  tensor([[199203.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6741650., grad_fn=<MseLossBackward>)
output :  tensor([[152669.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5430793.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150173.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5174e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119335.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(698582.5625, grad_fn=<MseLossBackward>)
output :  tensor([[140951.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(904727.9375, grad_fn=<MseLossBackward>)
output :  tensor([[145887.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(9686781., grad_fn=<MseLossBackward>)
output :  tensor([[200968.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6137e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159294.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(42127.5625, grad_fn=<MseLossBackward>)
output :  tensor([[100973.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(2171916., grad_fn=<MseLossBackward>)
output :  tensor([[222590.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0308e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188659.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3635e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173210.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(10723988., grad_fn=<MseLossBackward>)
output :  tensor([[87278.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(27866686., grad_fn=<MseLossBackward>)
output :  tensor([[130149.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2721417.2500, grad_fn=<MseLossBackward>)
output :  tensor([[214933.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(870518.1875, grad_fn=<MseLossBackward>)
output :  tensor([[143349.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(422947., grad_fn=<MseLossBackward>)
output :  tensor([[131881.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3540806.7500, grad_fn=<MseLossBackward>)
output :  tensor([[141451.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1317975.7500, grad_fn=<MseLossBackward>)
output :  tensor([[178807.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7063e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145064.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1134091.8750, grad_fn=<MseLossBackward>)
output :  tensor([[160345.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(119618.7109, grad_fn=<MseLossBackward>)
output :  tensor([[216065.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1134391.3750, grad_fn=<MseLossBackward>)
output :  tensor([[137221.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0382e+09, grad_fn=<MseLossBackward>)
output :  tensor([[258396.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(11534302., grad_fn=<MseLossBackward>)
output :  tensor([[160185.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(470103.0625, grad_fn=<MseLossBackward>)
output :  tensor([[131540.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(9242835., grad_fn=<MseLossBackward>)
output :  tensor([[95028.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(836.0230, grad_fn=<MseLossBackward>)
output :  tensor([[156092.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1255e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176976.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(8544386., grad_fn=<MseLossBackward>)
output :  tensor([[117841.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(7068661., grad_fn=<MseLossBackward>)
output :  tensor([[185346.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9013e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145991.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4211e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149225.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(454760.5625, grad_fn=<MseLossBackward>)
output :  tensor([[187815.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4249.4102, grad_fn=<MseLossBackward>)
output :  tensor([[251024.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7684e+09, grad_fn=<MseLossBackward>)
output :  tensor([[92913.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(1999064.6250, grad_fn=<MseLossBackward>)
output :  tensor([[236466.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(12485512., grad_fn=<MseLossBackward>)
output :  tensor([[123128.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(28853096., grad_fn=<MseLossBackward>)
output :  tensor([[166997.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7817e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114590.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1289e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176680.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(462740.0625, grad_fn=<MseLossBackward>)
output :  tensor([[165418.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7697e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154664.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8393e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235807.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(10193054., grad_fn=<MseLossBackward>)
output :  tensor([[224642.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1127e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130099.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(9609225., grad_fn=<MseLossBackward>)
output :  tensor([[125830.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(28645.5625, grad_fn=<MseLossBackward>)
output :  tensor([[222235.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(22704332., grad_fn=<MseLossBackward>)
output :  tensor([[226445.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(57068344., grad_fn=<MseLossBackward>)
output :  tensor([[224737.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3851897., grad_fn=<MseLossBackward>)
output :  tensor([[147813.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(34747.2891, grad_fn=<MseLossBackward>)
output :  tensor([[212751.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(7570838., grad_fn=<MseLossBackward>)
output :  tensor([[130350.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0714e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133851.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1825876.5000, grad_fn=<MseLossBackward>)
output :  tensor([[306156.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(78200856., grad_fn=<MseLossBackward>)
output :  tensor([[141761.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(579501.5625, grad_fn=<MseLossBackward>)
output :  tensor([[122449.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0746e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109575.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(5644.9395, grad_fn=<MseLossBackward>)
output :  tensor([[154801.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1325e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178408.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2769e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172624.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(140660.1562, grad_fn=<MseLossBackward>)
output :  tensor([[189981.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2141e+08, grad_fn=<MseLossBackward>)
output :  tensor([[102518.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(6340363.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177777.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1495385., grad_fn=<MseLossBackward>)
output :  tensor([[169107.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1457452.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142907.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(15269655., grad_fn=<MseLossBackward>)
output :  tensor([[258777.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0065e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141471.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1890e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176439.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(11828441., grad_fn=<MseLossBackward>)
output :  tensor([[141532.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2347694.2500, grad_fn=<MseLossBackward>)
output :  tensor([[201542.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1087034.2500, grad_fn=<MseLossBackward>)
output :  tensor([[169469.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(281562.8750, grad_fn=<MseLossBackward>)
output :  tensor([[241537.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6063906., grad_fn=<MseLossBackward>)
output :  tensor([[132848.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2728278., grad_fn=<MseLossBackward>)
output :  tensor([[150987.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2679973.7500, grad_fn=<MseLossBackward>)
output :  tensor([[211012.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(15896667., grad_fn=<MseLossBackward>)
output :  tensor([[161755.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(10527591., grad_fn=<MseLossBackward>)
output :  tensor([[187512.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2211215.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131656.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4764e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128068.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(867677.6875, grad_fn=<MseLossBackward>)
output :  tensor([[142319.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5380370., grad_fn=<MseLossBackward>)
output :  tensor([[197364.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2035e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165678.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5683e+09, grad_fn=<MseLossBackward>)
output :  tensor([[76140.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6051e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96396.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4152e+08, grad_fn=<MseLossBackward>)
output :  tensor([[247642.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(31927974., grad_fn=<MseLossBackward>)
output :  tensor([[200842.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8245e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115986.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(972380.8750, grad_fn=<MseLossBackward>)
output :  tensor([[159660.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7503e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206412.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8462e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177503.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5556e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157215.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4908855.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166837.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(10002493., grad_fn=<MseLossBackward>)
output :  tensor([[120203.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(27075112., grad_fn=<MseLossBackward>)
output :  tensor([[163396.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(70503840., grad_fn=<MseLossBackward>)
output :  tensor([[191685.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3147e+08, grad_fn=<MseLossBackward>)
output :  tensor([[217373.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4520142., grad_fn=<MseLossBackward>)
output :  tensor([[243720.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5128e+11, grad_fn=<MseLossBackward>)
output :  tensor([[144670.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5425405.5000, grad_fn=<MseLossBackward>)
output :  tensor([[107050.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2043023.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168835.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7068e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155284.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(22892188., grad_fn=<MseLossBackward>)
output :  tensor([[237723.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(522887.1562, grad_fn=<MseLossBackward>)
output :  tensor([[116869.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3496666.2500, grad_fn=<MseLossBackward>)
output :  tensor([[179620.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(10752456., grad_fn=<MseLossBackward>)
output :  tensor([[188920.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4930204., grad_fn=<MseLossBackward>)
output :  tensor([[163203.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4585e+10, grad_fn=<MseLossBackward>)
output :  tensor([[98163.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9460e+08, grad_fn=<MseLossBackward>)
output :  tensor([[234910.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(16726183., grad_fn=<MseLossBackward>)
output :  tensor([[177548.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2397223.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139200.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(638575.8125, grad_fn=<MseLossBackward>)
output :  tensor([[232257.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7522506., grad_fn=<MseLossBackward>)
output :  tensor([[160596.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5776136.5000, grad_fn=<MseLossBackward>)
output :  tensor([[199223.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5820e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133439.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2435940.5000, grad_fn=<MseLossBackward>)
output :  tensor([[185344.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4495e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134491.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2275100.7500, grad_fn=<MseLossBackward>)
output :  tensor([[221681.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0501e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224312.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5985e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93462.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(11991774., grad_fn=<MseLossBackward>)
output :  tensor([[157956.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2183699., grad_fn=<MseLossBackward>)
output :  tensor([[242152.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6570e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145883.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(780241., grad_fn=<MseLossBackward>)
output :  tensor([[107691.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6558e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163807.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(479599.5312, grad_fn=<MseLossBackward>)
output :  tensor([[145287.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1656409.2500, grad_fn=<MseLossBackward>)
output :  tensor([[127417.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(612000.6250, grad_fn=<MseLossBackward>)
output :  tensor([[188221.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0095e+09, grad_fn=<MseLossBackward>)
output :  tensor([[125484.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(8905189., grad_fn=<MseLossBackward>)
output :  tensor([[150539.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2133197.2500, grad_fn=<MseLossBackward>)
output :  tensor([[168556.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(10199241., grad_fn=<MseLossBackward>)
output :  tensor([[147424.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(12783977., grad_fn=<MseLossBackward>)
output :  tensor([[161398.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2254736.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135458.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0004e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134766.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7655511., grad_fn=<MseLossBackward>)
output :  tensor([[155074.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5839e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144488.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(113484.7656, grad_fn=<MseLossBackward>)
output :  tensor([[160321.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2039987.3750, grad_fn=<MseLossBackward>)
output :  tensor([[144229.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1785e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149499.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(489562.5938, grad_fn=<MseLossBackward>)
output :  tensor([[185652.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5510169.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170387.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1925980.1250, grad_fn=<MseLossBackward>)
output :  tensor([[180818.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(670146.8750, grad_fn=<MseLossBackward>)
output :  tensor([[218353.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2712094.2500, grad_fn=<MseLossBackward>)
output :  tensor([[111140.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(10502157., grad_fn=<MseLossBackward>)
output :  tensor([[139166.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0355e+08, grad_fn=<MseLossBackward>)
output :  tensor([[285855.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(20871.2188, grad_fn=<MseLossBackward>)
output :  tensor([[116499.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(249890.6406, grad_fn=<MseLossBackward>)
output :  tensor([[176528.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8898e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181465.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(12489708., grad_fn=<MseLossBackward>)
output :  tensor([[187907.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5797561., grad_fn=<MseLossBackward>)
output :  tensor([[253281.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7168e+08, grad_fn=<MseLossBackward>)
output :  tensor([[217158.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(23436038., grad_fn=<MseLossBackward>)
output :  tensor([[134914.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4181e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176372.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4628e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125118.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1250238.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182860.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5495e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150876.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4508854., grad_fn=<MseLossBackward>)
output :  tensor([[155097.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(73916472., grad_fn=<MseLossBackward>)
output :  tensor([[207823.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2322195., grad_fn=<MseLossBackward>)
output :  tensor([[143986.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3194e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176302.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(91440.0938, grad_fn=<MseLossBackward>)
output :  tensor([[247986.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9313e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147219.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(609692.5625, grad_fn=<MseLossBackward>)
output :  tensor([[202017.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(419397.9062, grad_fn=<MseLossBackward>)
output :  tensor([[157986.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3855025.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125795.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4285e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138498.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7551590., grad_fn=<MseLossBackward>)
output :  tensor([[179819.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(17478018., grad_fn=<MseLossBackward>)
output :  tensor([[199620.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(92550712., grad_fn=<MseLossBackward>)
output :  tensor([[215371.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4212e+09, grad_fn=<MseLossBackward>)
output :  tensor([[253084.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(15332486., grad_fn=<MseLossBackward>)
output :  tensor([[178944.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9616e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145343.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8991e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145107.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(369246.1250, grad_fn=<MseLossBackward>)
output :  tensor([[71632.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0006e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136198.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1436664.3750, grad_fn=<MseLossBackward>)
output :  tensor([[128058.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(708056.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155151.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1325520.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130782.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(14306006., grad_fn=<MseLossBackward>)
output :  tensor([[77864.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(1861156.7500, grad_fn=<MseLossBackward>)
output :  tensor([[84717.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7386844.5000, grad_fn=<MseLossBackward>)
output :  tensor([[241390.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(88174448., grad_fn=<MseLossBackward>)
output :  tensor([[139599.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3440e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130991.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(241180.7500, grad_fn=<MseLossBackward>)
output :  tensor([[166015.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(970071.1250, grad_fn=<MseLossBackward>)
output :  tensor([[235010.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(116.2354, grad_fn=<MseLossBackward>)
output :  tensor([[184009.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(66111128., grad_fn=<MseLossBackward>)
output :  tensor([[159620.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(13108925., grad_fn=<MseLossBackward>)
output :  tensor([[199469.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2464360.2500, grad_fn=<MseLossBackward>)
output :  tensor([[195888.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6902e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137950.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(903153.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153319.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2825656., grad_fn=<MseLossBackward>)
output :  tensor([[134627.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1883756.2500, grad_fn=<MseLossBackward>)
output :  tensor([[196321.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1342e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158379.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(19182210., grad_fn=<MseLossBackward>)
output :  tensor([[139228.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0911e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139917.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(24824528., grad_fn=<MseLossBackward>)
output :  tensor([[209025.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8848673., grad_fn=<MseLossBackward>)
output :  tensor([[105926.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7246e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166351.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1317975.7500, grad_fn=<MseLossBackward>)
output :  tensor([[127513.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(236454.2656, grad_fn=<MseLossBackward>)
output :  tensor([[144569.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5906115., grad_fn=<MseLossBackward>)
output :  tensor([[106092.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9105e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138980.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2192157.7500, grad_fn=<MseLossBackward>)
output :  tensor([[232058.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(15536284., grad_fn=<MseLossBackward>)
output :  tensor([[144922.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6057.2168, grad_fn=<MseLossBackward>)
output :  tensor([[138898.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1955583.7500, grad_fn=<MseLossBackward>)
output :  tensor([[165239.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3868e+09, grad_fn=<MseLossBackward>)
output :  tensor([[263296.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1619e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172732.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5143540.5000, grad_fn=<MseLossBackward>)
output :  tensor([[103664.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(789612.7500, grad_fn=<MseLossBackward>)
output :  tensor([[200749.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8906e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163404.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(19399620., grad_fn=<MseLossBackward>)
output :  tensor([[162964.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5994e+10, grad_fn=<MseLossBackward>)
output :  tensor([[98716.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(173836.8750, grad_fn=<MseLossBackward>)
output :  tensor([[123983.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(146928.4688, grad_fn=<MseLossBackward>)
output :  tensor([[158712.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7358334.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142762.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7630111.5000, grad_fn=<MseLossBackward>)
output :  tensor([[201411.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1993479.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144455.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(6027101.5000, grad_fn=<MseLossBackward>)
output :  tensor([[258576.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(13713019., grad_fn=<MseLossBackward>)
output :  tensor([[129600.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3396e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166745.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1550764.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188023.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(227260.7656, grad_fn=<MseLossBackward>)
output :  tensor([[124459.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0908e+08, grad_fn=<MseLossBackward>)
output :  tensor([[257241.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(52440000., grad_fn=<MseLossBackward>)
output :  tensor([[158059.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3756e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243855.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2234557.7500, grad_fn=<MseLossBackward>)
output :  tensor([[141756.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5033993.5000, grad_fn=<MseLossBackward>)
output :  tensor([[211185.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1406077.1250, grad_fn=<MseLossBackward>)
output :  tensor([[177875.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(29986404., grad_fn=<MseLossBackward>)
output :  tensor([[153019.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(960675.6250, grad_fn=<MseLossBackward>)
output :  tensor([[118763.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(582347.8125, grad_fn=<MseLossBackward>)
output :  tensor([[239589.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2563e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238707.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1670233.1250, grad_fn=<MseLossBackward>)
output :  tensor([[153445.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(11846.9619, grad_fn=<MseLossBackward>)
output :  tensor([[255520.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(385000.8750, grad_fn=<MseLossBackward>)
output :  tensor([[122698.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(67148168., grad_fn=<MseLossBackward>)
output :  tensor([[177528.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2336121.2500, grad_fn=<MseLossBackward>)
output :  tensor([[161716.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2944709.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135196.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(17610874., grad_fn=<MseLossBackward>)
output :  tensor([[198314.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7354e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162903.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1202312.2500, grad_fn=<MseLossBackward>)
output :  tensor([[165914.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(8496952., grad_fn=<MseLossBackward>)
output :  tensor([[159077.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1160030., grad_fn=<MseLossBackward>)
output :  tensor([[148652.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1555242.8750, grad_fn=<MseLossBackward>)
output :  tensor([[177810.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6664e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161362.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1856363.6250, grad_fn=<MseLossBackward>)
output :  tensor([[377743.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(38765800., grad_fn=<MseLossBackward>)
output :  tensor([[119310.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(59128652., grad_fn=<MseLossBackward>)
output :  tensor([[128346.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8358e+09, grad_fn=<MseLossBackward>)
output :  tensor([[284582.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(11350372., grad_fn=<MseLossBackward>)
output :  tensor([[162329.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(108457.0156, grad_fn=<MseLossBackward>)
output :  tensor([[131450.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1991e+08, grad_fn=<MseLossBackward>)
output :  tensor([[229803.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4823720., grad_fn=<MseLossBackward>)
output :  tensor([[177709.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(7787413.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151849.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(22518.7539, grad_fn=<MseLossBackward>)
output :  tensor([[141117.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(15076476., grad_fn=<MseLossBackward>)
output :  tensor([[157513.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2493e+08, grad_fn=<MseLossBackward>)
output :  tensor([[100561.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(314887.5625, grad_fn=<MseLossBackward>)
output :  tensor([[81302.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5381e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163094.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3631049.2500, grad_fn=<MseLossBackward>)
output :  tensor([[184319.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9080e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156713.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1654358.6250, grad_fn=<MseLossBackward>)
output :  tensor([[158461.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(923611.1250, grad_fn=<MseLossBackward>)
output :  tensor([[135855.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2543476.7500, grad_fn=<MseLossBackward>)
output :  tensor([[202879.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9430849., grad_fn=<MseLossBackward>)
output :  tensor([[137571.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(183224.1250, grad_fn=<MseLossBackward>)
output :  tensor([[180985.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6645e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146375.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(140695.3281, grad_fn=<MseLossBackward>)
output :  tensor([[108477.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4913e+08, grad_fn=<MseLossBackward>)
output :  tensor([[97708.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(13754711., grad_fn=<MseLossBackward>)
output :  tensor([[176594.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2543377., grad_fn=<MseLossBackward>)
output :  tensor([[257709.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(7236604.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139012.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6186956.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160357.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(213992.9844, grad_fn=<MseLossBackward>)
output :  tensor([[134452.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3814148., grad_fn=<MseLossBackward>)
output :  tensor([[148243.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1579813.3750, grad_fn=<MseLossBackward>)
output :  tensor([[170832.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8598457., grad_fn=<MseLossBackward>)
output :  tensor([[125272.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(2985579., grad_fn=<MseLossBackward>)
output :  tensor([[175988.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6027e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156476.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(274346.8125, grad_fn=<MseLossBackward>)
output :  tensor([[119257.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(7606090., grad_fn=<MseLossBackward>)
output :  tensor([[161216.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1529e+09, grad_fn=<MseLossBackward>)
output :  tensor([[52036.9492]], grad_fn=<AddmmBackward>)
loss:  tensor(1365.2448, grad_fn=<MseLossBackward>)
output :  tensor([[232028.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4757e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200118.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(776959.6250, grad_fn=<MseLossBackward>)
output :  tensor([[186745.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3046279.2500, grad_fn=<MseLossBackward>)
output :  tensor([[104413.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2516288.2500, grad_fn=<MseLossBackward>)
output :  tensor([[88197.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(1433538.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144845.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(23480234., grad_fn=<MseLossBackward>)
output :  tensor([[218069.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7654e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199719.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(60542988., grad_fn=<MseLossBackward>)
output :  tensor([[169567.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(20861486., grad_fn=<MseLossBackward>)
output :  tensor([[169627.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0959e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189305.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(482807.8438, grad_fn=<MseLossBackward>)
output :  tensor([[88734.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3007894., grad_fn=<MseLossBackward>)
output :  tensor([[141406.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1979385.2500, grad_fn=<MseLossBackward>)
output :  tensor([[108983.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2299819.7500, grad_fn=<MseLossBackward>)
output :  tensor([[148675.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6168e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172425.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7161e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193082.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4202e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176969.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9185446., grad_fn=<MseLossBackward>)
output :  tensor([[96212.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(82773.0859, grad_fn=<MseLossBackward>)
output :  tensor([[116424.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1156465., grad_fn=<MseLossBackward>)
output :  tensor([[158876.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3118e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202484.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6171964., grad_fn=<MseLossBackward>)
output :  tensor([[141997.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4010319.2500, grad_fn=<MseLossBackward>)
train_loss: [2.689147e+09]
epoch_result tensor([0.])
output :  tensor([[159711.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1467543., grad_fn=<MseLossBackward>)
output :  tensor([[121701.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(88962.3828, grad_fn=<MseLossBackward>)
output :  tensor([[194336.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(18415.3379, grad_fn=<MseLossBackward>)
output :  tensor([[180499.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(12243438., grad_fn=<MseLossBackward>)
output :  tensor([[155923.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8736e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128279.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(77845.3594, grad_fn=<MseLossBackward>)
output :  tensor([[139817.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1399008.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117786.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1473492.5000, grad_fn=<MseLossBackward>)
output :  tensor([[69502.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2105e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166270.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(73085.7422, grad_fn=<MseLossBackward>)
output :  tensor([[139895.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(10887.6182, grad_fn=<MseLossBackward>)
output :  tensor([[225624.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(390234.4688, grad_fn=<MseLossBackward>)
output :  tensor([[167941.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1119694.6250, grad_fn=<MseLossBackward>)
output :  tensor([[248421.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1633523.6250, grad_fn=<MseLossBackward>)
output :  tensor([[56779.6680]], grad_fn=<AddmmBackward>)
loss:  tensor(3167218., grad_fn=<MseLossBackward>)
output :  tensor([[164635.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0545e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172462.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6441285.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151280.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(27245300., grad_fn=<MseLossBackward>)
output :  tensor([[277032.]], grad_fn=<AddmmBackward>)
loss:  tensor(4129024., grad_fn=<MseLossBackward>)
output :  tensor([[197198.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(39309.2578, grad_fn=<MseLossBackward>)
output :  tensor([[136114.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6389e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191993.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3556347.7500, grad_fn=<MseLossBackward>)
output :  tensor([[176779.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3156e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151485.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(235406.9062, grad_fn=<MseLossBackward>)
output :  tensor([[168025.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3900316.5000, grad_fn=<MseLossBackward>)
output :  tensor([[85963.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(318060.7500, grad_fn=<MseLossBackward>)
output :  tensor([[167808.]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0039e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184034.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(933125.8125, grad_fn=<MseLossBackward>)
output :  tensor([[205191.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5310e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110763.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(582538.6250, grad_fn=<MseLossBackward>)
output :  tensor([[171125.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(15648.4463, grad_fn=<MseLossBackward>)
output :  tensor([[132829.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(13471882., grad_fn=<MseLossBackward>)
output :  tensor([[130925.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(3708122., grad_fn=<MseLossBackward>)
output :  tensor([[117345.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(4643048.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146736.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8425e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169417.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1194e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151382.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2830490.7500, grad_fn=<MseLossBackward>)
output :  tensor([[181028.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1057073.1250, grad_fn=<MseLossBackward>)
output :  tensor([[142149.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1320991., grad_fn=<MseLossBackward>)
output :  tensor([[104796.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1894e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135823.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2689e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136356.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1840346.6250, grad_fn=<MseLossBackward>)
output :  tensor([[132524.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(30519582., grad_fn=<MseLossBackward>)
output :  tensor([[222909.]], grad_fn=<AddmmBackward>)
loss:  tensor(4372281., grad_fn=<MseLossBackward>)
output :  tensor([[132304.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3011.2656, grad_fn=<MseLossBackward>)
output :  tensor([[147677.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1747725.3750, grad_fn=<MseLossBackward>)
output :  tensor([[116123.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(17001834., grad_fn=<MseLossBackward>)
output :  tensor([[162809.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7893729., grad_fn=<MseLossBackward>)
output :  tensor([[144182.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5824e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191009.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(980471.3125, grad_fn=<MseLossBackward>)
output :  tensor([[132977.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2169268.7500, grad_fn=<MseLossBackward>)
output :  tensor([[102278.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(59628560., grad_fn=<MseLossBackward>)
output :  tensor([[229657.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(18859614., grad_fn=<MseLossBackward>)
output :  tensor([[165056.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3458e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152054.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(48238452., grad_fn=<MseLossBackward>)
output :  tensor([[204705.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8155e+10, grad_fn=<MseLossBackward>)
output :  tensor([[241582.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2638e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143969.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(220195.5625, grad_fn=<MseLossBackward>)
output :  tensor([[137808.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(14508005., grad_fn=<MseLossBackward>)
output :  tensor([[158445.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(11873516., grad_fn=<MseLossBackward>)
output :  tensor([[131501.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2253798.5000, grad_fn=<MseLossBackward>)
output :  tensor([[181964.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0895e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182412.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2849185.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164522.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9136829., grad_fn=<MseLossBackward>)
output :  tensor([[142473.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(277547.8750, grad_fn=<MseLossBackward>)
output :  tensor([[142937.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(191378.9062, grad_fn=<MseLossBackward>)
output :  tensor([[143854.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1312385., grad_fn=<MseLossBackward>)
output :  tensor([[173410.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3925e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193418.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5607e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137558.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1121282.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174331.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5910293., grad_fn=<MseLossBackward>)
output :  tensor([[175699.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(28098116., grad_fn=<MseLossBackward>)
output :  tensor([[116064.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1133592.7500, grad_fn=<MseLossBackward>)
output :  tensor([[218140.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(8178795.5000, grad_fn=<MseLossBackward>)
output :  tensor([[184980.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2192666.7500, grad_fn=<MseLossBackward>)
output :  tensor([[124343.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1336805.6250, grad_fn=<MseLossBackward>)
output :  tensor([[199704.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(10266317., grad_fn=<MseLossBackward>)
output :  tensor([[173995.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(817639.8125, grad_fn=<MseLossBackward>)
output :  tensor([[207205.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2057e+10, grad_fn=<MseLossBackward>)
output :  tensor([[208399.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6764876., grad_fn=<MseLossBackward>)
output :  tensor([[169448.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4783e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194012.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(237884.8281, grad_fn=<MseLossBackward>)
output :  tensor([[114298.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(1686528.3750, grad_fn=<MseLossBackward>)
output :  tensor([[114595.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4390465.5000, grad_fn=<MseLossBackward>)
output :  tensor([[113699.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2888034.7500, grad_fn=<MseLossBackward>)
output :  tensor([[146733.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4386.9922, grad_fn=<MseLossBackward>)
output :  tensor([[159939.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3381e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177527.]], grad_fn=<AddmmBackward>)
loss:  tensor(6115729., grad_fn=<MseLossBackward>)
output :  tensor([[127907.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(166387.5156, grad_fn=<MseLossBackward>)
output :  tensor([[145906.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(821487.3125, grad_fn=<MseLossBackward>)
output :  tensor([[188190.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8399e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116431.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(219111.7656, grad_fn=<MseLossBackward>)
output :  tensor([[190835.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(38005684., grad_fn=<MseLossBackward>)
output :  tensor([[144352.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(419883.7500, grad_fn=<MseLossBackward>)
output :  tensor([[215296.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5741789.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125951.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(2310.7549, grad_fn=<MseLossBackward>)
output :  tensor([[243407.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(24212090., grad_fn=<MseLossBackward>)
output :  tensor([[235284.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4716e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150766.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7505e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85912.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2064e+08, grad_fn=<MseLossBackward>)
output :  tensor([[190578.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1101e+09, grad_fn=<MseLossBackward>)
output :  tensor([[77143.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(14872170., grad_fn=<MseLossBackward>)
output :  tensor([[141153.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2732460.7500, grad_fn=<MseLossBackward>)
output :  tensor([[74437.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(1129088.8750, grad_fn=<MseLossBackward>)
output :  tensor([[144567.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2606408.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175254.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(555653.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153870.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(136934.6875, grad_fn=<MseLossBackward>)
output :  tensor([[108184.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(616188.1875, grad_fn=<MseLossBackward>)
output :  tensor([[204458.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2386e+10, grad_fn=<MseLossBackward>)
output :  tensor([[126410.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(4365324.5000, grad_fn=<MseLossBackward>)
output :  tensor([[267165.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6472e+08, grad_fn=<MseLossBackward>)
output :  tensor([[302187.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(61041504., grad_fn=<MseLossBackward>)
output :  tensor([[107063.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(190716.4375, grad_fn=<MseLossBackward>)
output :  tensor([[170481.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4075540.7500, grad_fn=<MseLossBackward>)
output :  tensor([[133074.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2873e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140881.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3540277.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128708.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(2375861., grad_fn=<MseLossBackward>)
output :  tensor([[130217.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(27221002., grad_fn=<MseLossBackward>)
output :  tensor([[134255.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1283e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226249.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8711e+10, grad_fn=<MseLossBackward>)
output :  tensor([[185682.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4124e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144168.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(71932.9141, grad_fn=<MseLossBackward>)
output :  tensor([[127631.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(17214.2598, grad_fn=<MseLossBackward>)
output :  tensor([[112443.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(1425132.3750, grad_fn=<MseLossBackward>)
output :  tensor([[253845.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1236e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134158.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(707727.8750, grad_fn=<MseLossBackward>)
output :  tensor([[204695.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2875197.2500, grad_fn=<MseLossBackward>)
output :  tensor([[104589.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(96153.2891, grad_fn=<MseLossBackward>)
output :  tensor([[139024.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(856000.8125, grad_fn=<MseLossBackward>)
output :  tensor([[206098.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3862e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180052.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(23346.8848, grad_fn=<MseLossBackward>)
output :  tensor([[188351.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(11233076., grad_fn=<MseLossBackward>)
output :  tensor([[163512.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1167e+10, grad_fn=<MseLossBackward>)
output :  tensor([[295020.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5983e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200109.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4882788., grad_fn=<MseLossBackward>)
output :  tensor([[259785.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0470e+10, grad_fn=<MseLossBackward>)
output :  tensor([[218111.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2933e+09, grad_fn=<MseLossBackward>)
output :  tensor([[274686.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7904e+09, grad_fn=<MseLossBackward>)
output :  tensor([[221195.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7862766.5000, grad_fn=<MseLossBackward>)
output :  tensor([[220334.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9469e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195849.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1322536., grad_fn=<MseLossBackward>)
output :  tensor([[160036.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6327e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134751.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5068267.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137158.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2749015.7500, grad_fn=<MseLossBackward>)
output :  tensor([[90266.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(537724.3125, grad_fn=<MseLossBackward>)
output :  tensor([[106865.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1286948.5000, grad_fn=<MseLossBackward>)
output :  tensor([[273351.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0856e+09, grad_fn=<MseLossBackward>)
output :  tensor([[234403.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(355737.6875, grad_fn=<MseLossBackward>)
output :  tensor([[143826.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1376368.8750, grad_fn=<MseLossBackward>)
output :  tensor([[137439.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3696.2600, grad_fn=<MseLossBackward>)
output :  tensor([[174614.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(777896.4375, grad_fn=<MseLossBackward>)
output :  tensor([[144162.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1183540., grad_fn=<MseLossBackward>)
output :  tensor([[161964.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0586e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167861.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(8186125.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137126.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(15966.6914, grad_fn=<MseLossBackward>)
output :  tensor([[190889.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6771e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113930.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(3725714.2500, grad_fn=<MseLossBackward>)
output :  tensor([[171914.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7246.2656, grad_fn=<MseLossBackward>)
output :  tensor([[119340.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(434837.2188, grad_fn=<MseLossBackward>)
output :  tensor([[87273.]], grad_fn=<AddmmBackward>)
loss:  tensor(74529., grad_fn=<MseLossBackward>)
output :  tensor([[179818.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(33010.3477, grad_fn=<MseLossBackward>)
output :  tensor([[114792.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(23940072., grad_fn=<MseLossBackward>)
output :  tensor([[241165.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4689390., grad_fn=<MseLossBackward>)
output :  tensor([[247252.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5074742., grad_fn=<MseLossBackward>)
output :  tensor([[128549.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(902841.4375, grad_fn=<MseLossBackward>)
output :  tensor([[107649.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1714340.1250, grad_fn=<MseLossBackward>)
output :  tensor([[286052.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2832e+10, grad_fn=<MseLossBackward>)
output :  tensor([[173669.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4705578., grad_fn=<MseLossBackward>)
output :  tensor([[125912.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(831943.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144678.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1177e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198247.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4814e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138813.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4782695.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157343.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5045e+10, grad_fn=<MseLossBackward>)
output :  tensor([[156590.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(7237445., grad_fn=<MseLossBackward>)
output :  tensor([[129484.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(226.8789, grad_fn=<MseLossBackward>)
output :  tensor([[243455.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8237e+10, grad_fn=<MseLossBackward>)
output :  tensor([[389715.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5092e+08, grad_fn=<MseLossBackward>)
output :  tensor([[111061.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4249009., grad_fn=<MseLossBackward>)
output :  tensor([[123018.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(20419172., grad_fn=<MseLossBackward>)
output :  tensor([[160987.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2214097.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134444.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8241e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162728.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5132e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176908.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4767e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106249.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(7021961.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140050.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(902203.1250, grad_fn=<MseLossBackward>)
output :  tensor([[364117.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(10088167., grad_fn=<MseLossBackward>)
output :  tensor([[199799.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9377e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175332.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(27998.7012, grad_fn=<MseLossBackward>)
output :  tensor([[203651.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(565175.0625, grad_fn=<MseLossBackward>)
output :  tensor([[140822.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3322018.7500, grad_fn=<MseLossBackward>)
output :  tensor([[193288.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1468830.3750, grad_fn=<MseLossBackward>)
output :  tensor([[138952.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8928e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179202.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3232523., grad_fn=<MseLossBackward>)
output :  tensor([[238932.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(9407927., grad_fn=<MseLossBackward>)
output :  tensor([[173675.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(105057.0156, grad_fn=<MseLossBackward>)
output :  tensor([[109727.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2983176.7500, grad_fn=<MseLossBackward>)
output :  tensor([[265603.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1086350.2500, grad_fn=<MseLossBackward>)
output :  tensor([[255251.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(27582356., grad_fn=<MseLossBackward>)
output :  tensor([[121656.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(1805265.1250, grad_fn=<MseLossBackward>)
output :  tensor([[215183.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5780e+09, grad_fn=<MseLossBackward>)
output :  tensor([[300472.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1641e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209690.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(7239042.5000, grad_fn=<MseLossBackward>)
output :  tensor([[215016.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5621e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160056.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4650829., grad_fn=<MseLossBackward>)
output :  tensor([[177431.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(55373596., grad_fn=<MseLossBackward>)
output :  tensor([[164050.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(50667036., grad_fn=<MseLossBackward>)
output :  tensor([[170502.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(252207.9844, grad_fn=<MseLossBackward>)
output :  tensor([[231601.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3248e+09, grad_fn=<MseLossBackward>)
output :  tensor([[212700.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8073e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162458.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3897e+08, grad_fn=<MseLossBackward>)
output :  tensor([[121181.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(3305891., grad_fn=<MseLossBackward>)
output :  tensor([[174995.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4019523.7500, grad_fn=<MseLossBackward>)
output :  tensor([[180272.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3564e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205662.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5704e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136067.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2674655.7500, grad_fn=<MseLossBackward>)
output :  tensor([[152236.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3858e+08, grad_fn=<MseLossBackward>)
output :  tensor([[272545.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(19842848., grad_fn=<MseLossBackward>)
output :  tensor([[88864.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(14934481., grad_fn=<MseLossBackward>)
output :  tensor([[235410.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1187589.1250, grad_fn=<MseLossBackward>)
output :  tensor([[257402.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0597e+11, grad_fn=<MseLossBackward>)
output :  tensor([[171716.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2945460.5000, grad_fn=<MseLossBackward>)
output :  tensor([[190155.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0111e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153266.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3005835., grad_fn=<MseLossBackward>)
output :  tensor([[204754.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2570e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129867.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(753207., grad_fn=<MseLossBackward>)
output :  tensor([[144962.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1374.7874, grad_fn=<MseLossBackward>)
output :  tensor([[171064.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1592e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187469.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2623387.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128835.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(8040193., grad_fn=<MseLossBackward>)
output :  tensor([[136299.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(40369.6016, grad_fn=<MseLossBackward>)
output :  tensor([[172552.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(199822.9688, grad_fn=<MseLossBackward>)
output :  tensor([[199684.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5316e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239023.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(15810688., grad_fn=<MseLossBackward>)
output :  tensor([[151565.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(11793751., grad_fn=<MseLossBackward>)
output :  tensor([[200785.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(22897870., grad_fn=<MseLossBackward>)
output :  tensor([[165944.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8158e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177204.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5270037.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182415.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6329312.5000, grad_fn=<MseLossBackward>)
output :  tensor([[96844.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(24316.5039, grad_fn=<MseLossBackward>)
output :  tensor([[172803.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1491e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132968.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4128262., grad_fn=<MseLossBackward>)
output :  tensor([[123034.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(64548296., grad_fn=<MseLossBackward>)
output :  tensor([[175019.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1039029.8125, grad_fn=<MseLossBackward>)
output :  tensor([[84828.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(29291.7871, grad_fn=<MseLossBackward>)
output :  tensor([[281576.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(70956928., grad_fn=<MseLossBackward>)
output :  tensor([[166963.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3854412., grad_fn=<MseLossBackward>)
output :  tensor([[190895.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0242e+10, grad_fn=<MseLossBackward>)
output :  tensor([[242467.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1409e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154668.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(13460758., grad_fn=<MseLossBackward>)
output :  tensor([[122558.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(2076503.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122506.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6792783.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145505.]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3056e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177375.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(11392313., grad_fn=<MseLossBackward>)
output :  tensor([[114901.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0499e+09, grad_fn=<MseLossBackward>)
output :  tensor([[208842.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1915e+10, grad_fn=<MseLossBackward>)
output :  tensor([[235153.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(40278064., grad_fn=<MseLossBackward>)
output :  tensor([[249368.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1264e+10, grad_fn=<MseLossBackward>)
output :  tensor([[223088.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5319e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195364.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4433e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188132.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(399838.8438, grad_fn=<MseLossBackward>)
output :  tensor([[206543.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7666e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189408.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1489e+10, grad_fn=<MseLossBackward>)
output :  tensor([[182478.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(13973228., grad_fn=<MseLossBackward>)
output :  tensor([[153964.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3859137.5000, grad_fn=<MseLossBackward>)
output :  tensor([[338008.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1017954.8750, grad_fn=<MseLossBackward>)
output :  tensor([[212557.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(311311.6875, grad_fn=<MseLossBackward>)
output :  tensor([[161077.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1160602.2500, grad_fn=<MseLossBackward>)
output :  tensor([[183925.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3148e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107849.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(8119427.5000, grad_fn=<MseLossBackward>)
output :  tensor([[271232.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0524e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170166.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(13936339., grad_fn=<MseLossBackward>)
output :  tensor([[206739.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(45700136., grad_fn=<MseLossBackward>)
output :  tensor([[202851.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2935e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176589.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6815118., grad_fn=<MseLossBackward>)
output :  tensor([[198250.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(12602056., grad_fn=<MseLossBackward>)
output :  tensor([[158321.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(11032674., grad_fn=<MseLossBackward>)
output :  tensor([[150381.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5383e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118985.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(235414.4844, grad_fn=<MseLossBackward>)
output :  tensor([[139853.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(21334.2539, grad_fn=<MseLossBackward>)
output :  tensor([[151632.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6932606.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200031.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6376e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161981.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6159703.5000, grad_fn=<MseLossBackward>)
output :  tensor([[100582.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1172347.5000, grad_fn=<MseLossBackward>)
output :  tensor([[223375.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7639e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187066.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6510e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176182.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(91562.9766, grad_fn=<MseLossBackward>)
output :  tensor([[83587.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2519709.7500, grad_fn=<MseLossBackward>)
output :  tensor([[130704.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(4860819., grad_fn=<MseLossBackward>)
output :  tensor([[214960.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(922170.0625, grad_fn=<MseLossBackward>)
output :  tensor([[143877.]], grad_fn=<AddmmBackward>)
loss:  tensor(15129., grad_fn=<MseLossBackward>)
output :  tensor([[132034.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4137219.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143557.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(917135.4375, grad_fn=<MseLossBackward>)
output :  tensor([[181002.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8925e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145040.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1083290.6250, grad_fn=<MseLossBackward>)
output :  tensor([[158702.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1682695.3750, grad_fn=<MseLossBackward>)
output :  tensor([[212003.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8980042., grad_fn=<MseLossBackward>)
output :  tensor([[138488.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1215e+09, grad_fn=<MseLossBackward>)
output :  tensor([[255690.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(477135.5625, grad_fn=<MseLossBackward>)
output :  tensor([[160030.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(281927.8125, grad_fn=<MseLossBackward>)
output :  tensor([[128531.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1010.0479, grad_fn=<MseLossBackward>)
output :  tensor([[95544.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(296284.5938, grad_fn=<MseLossBackward>)
output :  tensor([[150679.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3797e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179642.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(66282.1094, grad_fn=<MseLossBackward>)
output :  tensor([[120340.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(25565.0117, grad_fn=<MseLossBackward>)
output :  tensor([[188586.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6292e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146985.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5542e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150686.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(618385.6250, grad_fn=<MseLossBackward>)
output :  tensor([[188325.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(331038.4062, grad_fn=<MseLossBackward>)
output :  tensor([[251436.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7339e+09, grad_fn=<MseLossBackward>)
output :  tensor([[94177.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(7170554.5000, grad_fn=<MseLossBackward>)
output :  tensor([[236258.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(13997536., grad_fn=<MseLossBackward>)
output :  tensor([[125693.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7874600.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167410.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7001e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116050.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5763e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177174.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1379303.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164553.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3272e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154939.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9730e+08, grad_fn=<MseLossBackward>)
output :  tensor([[241195.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4819397., grad_fn=<MseLossBackward>)
output :  tensor([[227507.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2978e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128255.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1575495.6250, grad_fn=<MseLossBackward>)
output :  tensor([[131636.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(31768018., grad_fn=<MseLossBackward>)
output :  tensor([[225856.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1308199.7500, grad_fn=<MseLossBackward>)
output :  tensor([[231669.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5429555.5000, grad_fn=<MseLossBackward>)
output :  tensor([[231018.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(18645934., grad_fn=<MseLossBackward>)
output :  tensor([[146181.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3305805.7500, grad_fn=<MseLossBackward>)
output :  tensor([[203582.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(41187916., grad_fn=<MseLossBackward>)
output :  tensor([[128786.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(77194896., grad_fn=<MseLossBackward>)
output :  tensor([[134187.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2847287., grad_fn=<MseLossBackward>)
output :  tensor([[308731.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(39290176., grad_fn=<MseLossBackward>)
output :  tensor([[138034.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8796971., grad_fn=<MseLossBackward>)
output :  tensor([[120582.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8711e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107937.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(2439966., grad_fn=<MseLossBackward>)
output :  tensor([[155421.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9169e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177920.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3712e+09, grad_fn=<MseLossBackward>)
output :  tensor([[169743.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(10605403., grad_fn=<MseLossBackward>)
output :  tensor([[188961.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4492e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96652.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(11208947., grad_fn=<MseLossBackward>)
output :  tensor([[179091.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8303.7656, grad_fn=<MseLossBackward>)
output :  tensor([[166098.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3244107.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141305.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5314177.5000, grad_fn=<MseLossBackward>)
output :  tensor([[259813.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8579e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144390.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5272e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171755.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1549519.2500, grad_fn=<MseLossBackward>)
output :  tensor([[136653.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(11199376., grad_fn=<MseLossBackward>)
output :  tensor([[197365.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(9823327., grad_fn=<MseLossBackward>)
output :  tensor([[169746.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(64381.1328, grad_fn=<MseLossBackward>)
output :  tensor([[242569.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2045793.8750, grad_fn=<MseLossBackward>)
output :  tensor([[134221.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(77588.3594, grad_fn=<MseLossBackward>)
output :  tensor([[152461.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(9684155., grad_fn=<MseLossBackward>)
output :  tensor([[213718.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1642602.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161699.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(10890516., grad_fn=<MseLossBackward>)
output :  tensor([[196304.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(53360972., grad_fn=<MseLossBackward>)
output :  tensor([[134938.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7898e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131821.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7959716., grad_fn=<MseLossBackward>)
output :  tensor([[134556.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(29633564., grad_fn=<MseLossBackward>)
output :  tensor([[198132.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0933e+09, grad_fn=<MseLossBackward>)
output :  tensor([[168776.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8919e+09, grad_fn=<MseLossBackward>)
output :  tensor([[78348.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3667e+08, grad_fn=<MseLossBackward>)
output :  tensor([[95541.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2192e+08, grad_fn=<MseLossBackward>)
output :  tensor([[251548.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3041808.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200894.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8309e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113944.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(1113964.7500, grad_fn=<MseLossBackward>)
output :  tensor([[159674.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7424e+08, grad_fn=<MseLossBackward>)
output :  tensor([[205106.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2181e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179032.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2750e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157366.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5600248.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167694.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5315258., grad_fn=<MseLossBackward>)
output :  tensor([[117250.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(5063168., grad_fn=<MseLossBackward>)
output :  tensor([[166193.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2530e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194517.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5332e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222902.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(11577325., grad_fn=<MseLossBackward>)
output :  tensor([[242734.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5227e+11, grad_fn=<MseLossBackward>)
output :  tensor([[146370.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(395876.9062, grad_fn=<MseLossBackward>)
output :  tensor([[109285.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(648566., grad_fn=<MseLossBackward>)
output :  tensor([[168426.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8153e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152709.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4882580.5000, grad_fn=<MseLossBackward>)
output :  tensor([[229299.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(59290480., grad_fn=<MseLossBackward>)
output :  tensor([[114689.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(96371.4375, grad_fn=<MseLossBackward>)
output :  tensor([[181276.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2634433.2500, grad_fn=<MseLossBackward>)
output :  tensor([[184811.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3565311., grad_fn=<MseLossBackward>)
output :  tensor([[166338.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3612e+10, grad_fn=<MseLossBackward>)
output :  tensor([[96523.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4097e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235310.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(13608952., grad_fn=<MseLossBackward>)
output :  tensor([[178720.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7401800.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141703.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2903243.2500, grad_fn=<MseLossBackward>)
output :  tensor([[236119.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1253140.3750, grad_fn=<MseLossBackward>)
output :  tensor([[164517.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2303375.2500, grad_fn=<MseLossBackward>)
output :  tensor([[199187.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5829e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134896.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(10725.1914, grad_fn=<MseLossBackward>)
output :  tensor([[185481.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5140e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138726.]], grad_fn=<AddmmBackward>)
loss:  tensor(7431076., grad_fn=<MseLossBackward>)
output :  tensor([[223681.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5174e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223966.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7772e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91548.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2398384.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160694.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1589569.3750, grad_fn=<MseLossBackward>)
output :  tensor([[245277.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5776e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145369.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(136888.4375, grad_fn=<MseLossBackward>)
output :  tensor([[110208.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8670e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162931.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2460927.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140942.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(9349262., grad_fn=<MseLossBackward>)
output :  tensor([[130656.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(6035121.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191555.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5488e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124064.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(2449102.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153700.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2892338., grad_fn=<MseLossBackward>)
output :  tensor([[170184.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2449714., grad_fn=<MseLossBackward>)
output :  tensor([[151435.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(189360.9688, grad_fn=<MseLossBackward>)
output :  tensor([[160520.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5662838., grad_fn=<MseLossBackward>)
output :  tensor([[136065.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3254e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132369.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(136668.8438, grad_fn=<MseLossBackward>)
output :  tensor([[155592.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7529e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145395.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1546952.8750, grad_fn=<MseLossBackward>)
output :  tensor([[162904.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1333195., grad_fn=<MseLossBackward>)
output :  tensor([[141478.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9721e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147380.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2015601.3750, grad_fn=<MseLossBackward>)
output :  tensor([[184544.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(11942856., grad_fn=<MseLossBackward>)
output :  tensor([[169538.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(289528.0625, grad_fn=<MseLossBackward>)
output :  tensor([[180077.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5989.3086, grad_fn=<MseLossBackward>)
output :  tensor([[220990.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(980223.7500, grad_fn=<MseLossBackward>)
output :  tensor([[111086.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(10151293., grad_fn=<MseLossBackward>)
output :  tensor([[138077.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7364e+08, grad_fn=<MseLossBackward>)
output :  tensor([[286110.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(12113.7539, grad_fn=<MseLossBackward>)
output :  tensor([[114764.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(1525939.1250, grad_fn=<MseLossBackward>)
output :  tensor([[175259.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0017e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184276.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(523113.1562, grad_fn=<MseLossBackward>)
output :  tensor([[179234.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(39252964., grad_fn=<MseLossBackward>)
output :  tensor([[250425.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0388e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221444.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(308441.3750, grad_fn=<MseLossBackward>)
output :  tensor([[132326.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9835e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177657.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0800e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122738.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1591934.2500, grad_fn=<MseLossBackward>)
output :  tensor([[182303.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5780e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150083.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(8508616., grad_fn=<MseLossBackward>)
output :  tensor([[153924.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(55118792., grad_fn=<MseLossBackward>)
output :  tensor([[202397.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(15230116., grad_fn=<MseLossBackward>)
output :  tensor([[145686.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7389e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175717.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(79559.2500, grad_fn=<MseLossBackward>)
output :  tensor([[247246.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0403e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147981.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(345.7275, grad_fn=<MseLossBackward>)
output :  tensor([[207310.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(21579654., grad_fn=<MseLossBackward>)
output :  tensor([[167403.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(55556292., grad_fn=<MseLossBackward>)
output :  tensor([[126897.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5130e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134140.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2591043.5000, grad_fn=<MseLossBackward>)
output :  tensor([[184362.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(131576.2344, grad_fn=<MseLossBackward>)
output :  tensor([[195061.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(25615778., grad_fn=<MseLossBackward>)
output :  tensor([[214209.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5936e+09, grad_fn=<MseLossBackward>)
output :  tensor([[255891.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1228806.8750, grad_fn=<MseLossBackward>)
output :  tensor([[183668.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8315e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144534.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8126e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141765.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(7477832., grad_fn=<MseLossBackward>)
output :  tensor([[73540.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1250e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127353.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(58467052., grad_fn=<MseLossBackward>)
output :  tensor([[131244.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5494849., grad_fn=<MseLossBackward>)
output :  tensor([[152788.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1468375.8750, grad_fn=<MseLossBackward>)
output :  tensor([[129757.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(7601092., grad_fn=<MseLossBackward>)
output :  tensor([[75645.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(729636.3125, grad_fn=<MseLossBackward>)
output :  tensor([[83393.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(1941951.1250, grad_fn=<MseLossBackward>)
output :  tensor([[230243.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3086005.7500, grad_fn=<MseLossBackward>)
output :  tensor([[140657.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9287e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125955.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(20651344., grad_fn=<MseLossBackward>)
output :  tensor([[169346.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5508262.5000, grad_fn=<MseLossBackward>)
output :  tensor([[235509.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(259590.2500, grad_fn=<MseLossBackward>)
output :  tensor([[185203.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(48108528., grad_fn=<MseLossBackward>)
output :  tensor([[156490.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(241004.2812, grad_fn=<MseLossBackward>)
output :  tensor([[192855.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(25448556., grad_fn=<MseLossBackward>)
output :  tensor([[196913.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6069e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136702.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(88236.8438, grad_fn=<MseLossBackward>)
output :  tensor([[156460.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2134155.7500, grad_fn=<MseLossBackward>)
output :  tensor([[136672.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(451773.0312, grad_fn=<MseLossBackward>)
output :  tensor([[196570.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1176e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157302.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(10904649., grad_fn=<MseLossBackward>)
output :  tensor([[139013.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0715e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148556.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(13367936., grad_fn=<MseLossBackward>)
output :  tensor([[206784.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(27198506., grad_fn=<MseLossBackward>)
output :  tensor([[104621.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1173e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168903.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1968979., grad_fn=<MseLossBackward>)
output :  tensor([[130086.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(4353189., grad_fn=<MseLossBackward>)
output :  tensor([[144685.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5357561., grad_fn=<MseLossBackward>)
output :  tensor([[104390.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7646e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137187.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(97539.0938, grad_fn=<MseLossBackward>)
output :  tensor([[234848.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1325232.6250, grad_fn=<MseLossBackward>)
output :  tensor([[146775.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3151679., grad_fn=<MseLossBackward>)
output :  tensor([[140077.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(6645842.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165019.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3704e+09, grad_fn=<MseLossBackward>)
output :  tensor([[262029.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5505e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178033.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(9200700., grad_fn=<MseLossBackward>)
output :  tensor([[105447.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7134825.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200177.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9787e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158987.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(148.9163, grad_fn=<MseLossBackward>)
output :  tensor([[163621.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5712e+10, grad_fn=<MseLossBackward>)
output :  tensor([[100203.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3624442.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123208.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(153480.3125, grad_fn=<MseLossBackward>)
output :  tensor([[158284.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5220511., grad_fn=<MseLossBackward>)
output :  tensor([[142935.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(8619179., grad_fn=<MseLossBackward>)
output :  tensor([[199911.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7859.9307, grad_fn=<MseLossBackward>)
output :  tensor([[141516.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(234104.7812, grad_fn=<MseLossBackward>)
output :  tensor([[261285.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(988253.4375, grad_fn=<MseLossBackward>)
output :  tensor([[129378.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3234e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166440.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(885245.7500, grad_fn=<MseLossBackward>)
output :  tensor([[189042.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(293831.7500, grad_fn=<MseLossBackward>)
output :  tensor([[122297.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5124e+08, grad_fn=<MseLossBackward>)
output :  tensor([[252252.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5074953., grad_fn=<MseLossBackward>)
output :  tensor([[159512.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5554e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244367.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(966104.6875, grad_fn=<MseLossBackward>)
output :  tensor([[144315.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(99451.5391, grad_fn=<MseLossBackward>)
output :  tensor([[210273.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(74580.1953, grad_fn=<MseLossBackward>)
output :  tensor([[175683.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(10783732., grad_fn=<MseLossBackward>)
output :  tensor([[152449.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2404438., grad_fn=<MseLossBackward>)
output :  tensor([[118943.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(890177.5000, grad_fn=<MseLossBackward>)
output :  tensor([[238353.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3752e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237990.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4039409., grad_fn=<MseLossBackward>)
output :  tensor([[153756.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(175731.2656, grad_fn=<MseLossBackward>)
output :  tensor([[253169.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2993008.2500, grad_fn=<MseLossBackward>)
output :  tensor([[121545.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(49589652., grad_fn=<MseLossBackward>)
output :  tensor([[175940.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3538.3909, grad_fn=<MseLossBackward>)
output :  tensor([[160524.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(275198.5938, grad_fn=<MseLossBackward>)
output :  tensor([[128916.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4342209.5000, grad_fn=<MseLossBackward>)
output :  tensor([[197174.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5799e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163002.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(995037.4375, grad_fn=<MseLossBackward>)
output :  tensor([[160024.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8854623., grad_fn=<MseLossBackward>)
output :  tensor([[157603.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(157522.1719, grad_fn=<MseLossBackward>)
output :  tensor([[153713.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(14543259., grad_fn=<MseLossBackward>)
output :  tensor([[174861.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2721e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159480.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(270318.7500, grad_fn=<MseLossBackward>)
output :  tensor([[375526.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(71296912., grad_fn=<MseLossBackward>)
output :  tensor([[131858.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(23603504., grad_fn=<MseLossBackward>)
output :  tensor([[127658.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7774e+09, grad_fn=<MseLossBackward>)
output :  tensor([[280151.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1127180.3750, grad_fn=<MseLossBackward>)
output :  tensor([[161028.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(944662.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131654.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2443e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236972.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(24723892., grad_fn=<MseLossBackward>)
output :  tensor([[179722.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(604384.7500, grad_fn=<MseLossBackward>)
output :  tensor([[152874.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(765515.6250, grad_fn=<MseLossBackward>)
output :  tensor([[144259.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(548803.1875, grad_fn=<MseLossBackward>)
output :  tensor([[156730.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9325e+08, grad_fn=<MseLossBackward>)
output :  tensor([[101669.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(2786108.7500, grad_fn=<MseLossBackward>)
output :  tensor([[82627.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1198e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165284.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(80922.4688, grad_fn=<MseLossBackward>)
output :  tensor([[188499.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5603e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160609.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6810876.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155223.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5182594.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139333.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3547336.7500, grad_fn=<MseLossBackward>)
output :  tensor([[207671.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2964638.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139635.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2674604.7500, grad_fn=<MseLossBackward>)
output :  tensor([[182031.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6376e+10, grad_fn=<MseLossBackward>)
output :  tensor([[140752.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(27532648., grad_fn=<MseLossBackward>)
output :  tensor([[111393.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0619e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96756.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7600876.5000, grad_fn=<MseLossBackward>)
output :  tensor([[173551.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2096930.2500, grad_fn=<MseLossBackward>)
output :  tensor([[260454.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2994.1416, grad_fn=<MseLossBackward>)
output :  tensor([[141254.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(60431.4688, grad_fn=<MseLossBackward>)
output :  tensor([[160405.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(260578.3438, grad_fn=<MseLossBackward>)
output :  tensor([[134498.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3993939.7500, grad_fn=<MseLossBackward>)
output :  tensor([[148223.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1628375.3750, grad_fn=<MseLossBackward>)
output :  tensor([[166542.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1843060.7500, grad_fn=<MseLossBackward>)
output :  tensor([[126286.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(508747.8438, grad_fn=<MseLossBackward>)
output :  tensor([[176070.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6536e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158903.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3624918.5000, grad_fn=<MseLossBackward>)
output :  tensor([[118193.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2868365.7500, grad_fn=<MseLossBackward>)
output :  tensor([[159920.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3406e+09, grad_fn=<MseLossBackward>)
output :  tensor([[52298.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(89284.2422, grad_fn=<MseLossBackward>)
output :  tensor([[232743.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3611e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200075.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(854613.5625, grad_fn=<MseLossBackward>)
output :  tensor([[182548.]], grad_fn=<AddmmBackward>)
loss:  tensor(6012304., grad_fn=<MseLossBackward>)
output :  tensor([[105692.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(94537.0312, grad_fn=<MseLossBackward>)
output :  tensor([[86646.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(125083.7969, grad_fn=<MseLossBackward>)
output :  tensor([[137025.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8847093., grad_fn=<MseLossBackward>)
output :  tensor([[217938.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7853e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199894.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(57850284., grad_fn=<MseLossBackward>)
output :  tensor([[167969.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(8815054., grad_fn=<MseLossBackward>)
output :  tensor([[171709.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7032e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191059.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1122838.2500, grad_fn=<MseLossBackward>)
output :  tensor([[87609.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(372014.2188, grad_fn=<MseLossBackward>)
output :  tensor([[140558.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(311835., grad_fn=<MseLossBackward>)
output :  tensor([[113847.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(11207535., grad_fn=<MseLossBackward>)
output :  tensor([[150055.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9867e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174821.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9203e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193596.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3004e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180852.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(726143.6250, grad_fn=<MseLossBackward>)
output :  tensor([[97491.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(982824.3750, grad_fn=<MseLossBackward>)
output :  tensor([[118368.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(754658.6875, grad_fn=<MseLossBackward>)
output :  tensor([[161200.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1983e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197506.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6215750., grad_fn=<MseLossBackward>)
output :  tensor([[143781.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(47537.6250, grad_fn=<MseLossBackward>)
train_loss: [2.654155e+09]
epoch_result tensor([0.])
output :  tensor([[158828.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(108086.8359, grad_fn=<MseLossBackward>)
output :  tensor([[124427.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5891087.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194719.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(268890.8750, grad_fn=<MseLossBackward>)
output :  tensor([[176930.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4873.7852, grad_fn=<MseLossBackward>)
output :  tensor([[155729.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9598e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126906.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1195195.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141510.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(260179.6875, grad_fn=<MseLossBackward>)
output :  tensor([[120901.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(3615672.5000, grad_fn=<MseLossBackward>)
output :  tensor([[70613.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4674e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167066.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1137422.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139967.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1052.1914, grad_fn=<MseLossBackward>)
output :  tensor([[224362.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(406665.2812, grad_fn=<MseLossBackward>)
output :  tensor([[168369.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(397983.5625, grad_fn=<MseLossBackward>)
output :  tensor([[247734.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3864050.2500, grad_fn=<MseLossBackward>)
output :  tensor([[55536.7461]], grad_fn=<AddmmBackward>)
loss:  tensor(288096.3750, grad_fn=<MseLossBackward>)
output :  tensor([[164347.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9392e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179836.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(23392336., grad_fn=<MseLossBackward>)
output :  tensor([[167825.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2826e+08, grad_fn=<MseLossBackward>)
output :  tensor([[275594.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(353244.5000, grad_fn=<MseLossBackward>)
output :  tensor([[196515.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(235194.6875, grad_fn=<MseLossBackward>)
output :  tensor([[135508.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6725e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195742.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3470943.7500, grad_fn=<MseLossBackward>)
output :  tensor([[177726.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2253e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150859.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(19770.9961, grad_fn=<MseLossBackward>)
output :  tensor([[179429.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(88907808., grad_fn=<MseLossBackward>)
output :  tensor([[85167.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(53853.0039, grad_fn=<MseLossBackward>)
output :  tensor([[167522.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9727e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185243.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(59513.1289, grad_fn=<MseLossBackward>)
output :  tensor([[203172.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7381e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108519.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(2192505., grad_fn=<MseLossBackward>)
output :  tensor([[169969.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1062284.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136200.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(89419.6875, grad_fn=<MseLossBackward>)
output :  tensor([[125584.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(11667935., grad_fn=<MseLossBackward>)
output :  tensor([[121442.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(3771697.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147826.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5025e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171397.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0622e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153100.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(11560106., grad_fn=<MseLossBackward>)
output :  tensor([[181491.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2224432.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141079.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6320.2500, grad_fn=<MseLossBackward>)
output :  tensor([[104741.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1732e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136643.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1397e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134433.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(321329.5625, grad_fn=<MseLossBackward>)
output :  tensor([[133744.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(45488492., grad_fn=<MseLossBackward>)
output :  tensor([[224742.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(66491.4609, grad_fn=<MseLossBackward>)
output :  tensor([[132694.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(197621.9219, grad_fn=<MseLossBackward>)
output :  tensor([[146968.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4126611.2500, grad_fn=<MseLossBackward>)
output :  tensor([[110427.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(2472780.7500, grad_fn=<MseLossBackward>)
output :  tensor([[160412.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(169847.0156, grad_fn=<MseLossBackward>)
output :  tensor([[143544.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6477e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195649.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(13315771., grad_fn=<MseLossBackward>)
output :  tensor([[133977.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(223669.8750, grad_fn=<MseLossBackward>)
output :  tensor([[117457.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(55609064., grad_fn=<MseLossBackward>)
output :  tensor([[234304.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(92777.3516, grad_fn=<MseLossBackward>)
output :  tensor([[163568.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4921e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154686.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(18608844., grad_fn=<MseLossBackward>)
output :  tensor([[204616.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8185e+10, grad_fn=<MseLossBackward>)
output :  tensor([[245416.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1790e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145093.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2539640.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135500.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2252344.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156193.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1424442.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132429.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5902546., grad_fn=<MseLossBackward>)
output :  tensor([[182668.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9802e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185010.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(828896.4375, grad_fn=<MseLossBackward>)
output :  tensor([[162428.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(861242., grad_fn=<MseLossBackward>)
output :  tensor([[154908.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4180e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141816.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(466830.5625, grad_fn=<MseLossBackward>)
output :  tensor([[148871.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(14986093., grad_fn=<MseLossBackward>)
output :  tensor([[170951.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7245e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193397.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5706e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138399.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3607150.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172180.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(78408.7500, grad_fn=<MseLossBackward>)
output :  tensor([[174892.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(37304992., grad_fn=<MseLossBackward>)
output :  tensor([[116558.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2427704.7500, grad_fn=<MseLossBackward>)
output :  tensor([[220611.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(150798.7344, grad_fn=<MseLossBackward>)
output :  tensor([[183248.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(63448.8867, grad_fn=<MseLossBackward>)
output :  tensor([[126036.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(288293.5000, grad_fn=<MseLossBackward>)
output :  tensor([[197782.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1645287.2500, grad_fn=<MseLossBackward>)
output :  tensor([[178655.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(14102607., grad_fn=<MseLossBackward>)
output :  tensor([[205450.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2688e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209977.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1046049.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169668.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4953e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194161.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(114910.4062, grad_fn=<MseLossBackward>)
output :  tensor([[112723.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(76491.1406, grad_fn=<MseLossBackward>)
output :  tensor([[113581.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1169845., grad_fn=<MseLossBackward>)
output :  tensor([[113138.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(1295132.8750, grad_fn=<MseLossBackward>)
output :  tensor([[150394.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(12918521., grad_fn=<MseLossBackward>)
output :  tensor([[160542.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3161e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180225.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(50906.6406, grad_fn=<MseLossBackward>)
output :  tensor([[129813.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5353656., grad_fn=<MseLossBackward>)
output :  tensor([[142470.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6398923.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182935.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3074e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120572.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(13487371., grad_fn=<MseLossBackward>)
output :  tensor([[199314.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5355825.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151127.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(37540320., grad_fn=<MseLossBackward>)
output :  tensor([[212498.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(161076.8125, grad_fn=<MseLossBackward>)
output :  tensor([[127031.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1064379.1250, grad_fn=<MseLossBackward>)
output :  tensor([[246610.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2949055., grad_fn=<MseLossBackward>)
output :  tensor([[233916.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6095e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151127.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8918e+08, grad_fn=<MseLossBackward>)
output :  tensor([[86183.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3422e+08, grad_fn=<MseLossBackward>)
output :  tensor([[191138.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0159e+09, grad_fn=<MseLossBackward>)
output :  tensor([[82368.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1871894.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139641.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(19885.4062, grad_fn=<MseLossBackward>)
output :  tensor([[78620.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(9734888., grad_fn=<MseLossBackward>)
output :  tensor([[142595.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(127705.7266, grad_fn=<MseLossBackward>)
output :  tensor([[175727.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(74188.1406, grad_fn=<MseLossBackward>)
output :  tensor([[152370.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1276229.1250, grad_fn=<MseLossBackward>)
output :  tensor([[106694.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(497410.6250, grad_fn=<MseLossBackward>)
output :  tensor([[200368.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3313e+10, grad_fn=<MseLossBackward>)
output :  tensor([[127579.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(847176.4375, grad_fn=<MseLossBackward>)
output :  tensor([[268091.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4181e+08, grad_fn=<MseLossBackward>)
output :  tensor([[300855.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(83628168., grad_fn=<MseLossBackward>)
output :  tensor([[109761.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5112262.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169732.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(7658451., grad_fn=<MseLossBackward>)
output :  tensor([[134781.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1724e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139207.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(43114.6289, grad_fn=<MseLossBackward>)
output :  tensor([[131511.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1591579.3750, grad_fn=<MseLossBackward>)
output :  tensor([[127921.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(8532652., grad_fn=<MseLossBackward>)
output :  tensor([[135535.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7786e+08, grad_fn=<MseLossBackward>)
output :  tensor([[228463.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7844e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186043.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4012e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142111.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3200409.2500, grad_fn=<MseLossBackward>)
output :  tensor([[127210.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(83801.2031, grad_fn=<MseLossBackward>)
output :  tensor([[111008.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(58303.3828, grad_fn=<MseLossBackward>)
output :  tensor([[251261.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4622e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136784.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3185332.5000, grad_fn=<MseLossBackward>)
output :  tensor([[203166.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(27836.8359, grad_fn=<MseLossBackward>)
output :  tensor([[106187.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(1658159.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140735.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(616789.3750, grad_fn=<MseLossBackward>)
output :  tensor([[208155.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6714e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174839.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(25609450., grad_fn=<MseLossBackward>)
output :  tensor([[187762.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7631838., grad_fn=<MseLossBackward>)
output :  tensor([[164982.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0741e+10, grad_fn=<MseLossBackward>)
output :  tensor([[292232.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8290e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197875.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(588.8206, grad_fn=<MseLossBackward>)
output :  tensor([[261505.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9981e+10, grad_fn=<MseLossBackward>)
output :  tensor([[214034.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7004e+09, grad_fn=<MseLossBackward>)
output :  tensor([[284988.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0247e+09, grad_fn=<MseLossBackward>)
output :  tensor([[223195.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(647144.8125, grad_fn=<MseLossBackward>)
output :  tensor([[222599.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8697e+10, grad_fn=<MseLossBackward>)
output :  tensor([[204761.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(60233364., grad_fn=<MseLossBackward>)
output :  tensor([[160155.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7067e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129306.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(10200887., grad_fn=<MseLossBackward>)
output :  tensor([[135726.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(51146.6484, grad_fn=<MseLossBackward>)
output :  tensor([[92868.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(3492898.2500, grad_fn=<MseLossBackward>)
output :  tensor([[106557.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2081572.6250, grad_fn=<MseLossBackward>)
output :  tensor([[271997.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2379e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237649.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7021092.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144028.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(943539.0625, grad_fn=<MseLossBackward>)
output :  tensor([[135984.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2295840.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174769.]], grad_fn=<AddmmBackward>)
loss:  tensor(1073296., grad_fn=<MseLossBackward>)
output :  tensor([[142295.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8729440., grad_fn=<MseLossBackward>)
output :  tensor([[164190.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1868e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166405.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1974771.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137424.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(180439.1094, grad_fn=<MseLossBackward>)
output :  tensor([[191785.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8005e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113413.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(1996900.1250, grad_fn=<MseLossBackward>)
output :  tensor([[176311.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(18587280., grad_fn=<MseLossBackward>)
output :  tensor([[121053.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(1110636., grad_fn=<MseLossBackward>)
output :  tensor([[85923.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(1158566.3750, grad_fn=<MseLossBackward>)
output :  tensor([[180526.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(277169.3438, grad_fn=<MseLossBackward>)
output :  tensor([[112495.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6736863.5000, grad_fn=<MseLossBackward>)
output :  tensor([[238317.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(465465.0625, grad_fn=<MseLossBackward>)
output :  tensor([[244371.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(395464.1250, grad_fn=<MseLossBackward>)
output :  tensor([[132118.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6855887.5000, grad_fn=<MseLossBackward>)
output :  tensor([[114375.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(29343720., grad_fn=<MseLossBackward>)
output :  tensor([[287241.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2474e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171940.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(193723.7656, grad_fn=<MseLossBackward>)
output :  tensor([[124500.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(249164.7656, grad_fn=<MseLossBackward>)
output :  tensor([[144207.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8683e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196886.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9286e+08, grad_fn=<MseLossBackward>)
output :  tensor([[143105.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4431156.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155178.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5580e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153117.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(612453., grad_fn=<MseLossBackward>)
output :  tensor([[131567.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4273652., grad_fn=<MseLossBackward>)
output :  tensor([[240755.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8974e+10, grad_fn=<MseLossBackward>)
output :  tensor([[396465.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(30628614., grad_fn=<MseLossBackward>)
output :  tensor([[109904.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(818643.2500, grad_fn=<MseLossBackward>)
output :  tensor([[113494.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(25058862., grad_fn=<MseLossBackward>)
output :  tensor([[158663.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(699967.5625, grad_fn=<MseLossBackward>)
output :  tensor([[134232.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9076e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160888.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7346e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174542.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1657e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105886.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(5225831.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141067.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4621.8750, grad_fn=<MseLossBackward>)
output :  tensor([[366298.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(991269.1250, grad_fn=<MseLossBackward>)
output :  tensor([[201554.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7506e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179727.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(17874530., grad_fn=<MseLossBackward>)
output :  tensor([[202955.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3095.8792, grad_fn=<MseLossBackward>)
output :  tensor([[139450.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(202570.3125, grad_fn=<MseLossBackward>)
output :  tensor([[196413.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3661960.7500, grad_fn=<MseLossBackward>)
output :  tensor([[137015.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7118e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182383.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1914720.8750, grad_fn=<MseLossBackward>)
output :  tensor([[239280.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7393131., grad_fn=<MseLossBackward>)
output :  tensor([[173524.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(225639.8438, grad_fn=<MseLossBackward>)
output :  tensor([[107031.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(937962., grad_fn=<MseLossBackward>)
output :  tensor([[264364.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(38526.3281, grad_fn=<MseLossBackward>)
output :  tensor([[255532.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(30607174., grad_fn=<MseLossBackward>)
output :  tensor([[122347.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(425746.0625, grad_fn=<MseLossBackward>)
output :  tensor([[212617.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8915e+09, grad_fn=<MseLossBackward>)
output :  tensor([[301547.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6420e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209938.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(8636894., grad_fn=<MseLossBackward>)
output :  tensor([[213451.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6015e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158485.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(342883.4375, grad_fn=<MseLossBackward>)
output :  tensor([[172332.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5488331., grad_fn=<MseLossBackward>)
output :  tensor([[156864.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4581.5977, grad_fn=<MseLossBackward>)
output :  tensor([[166750.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(10560977., grad_fn=<MseLossBackward>)
output :  tensor([[233204.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2107e+09, grad_fn=<MseLossBackward>)
output :  tensor([[217796.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3594e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164256.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9779e+08, grad_fn=<MseLossBackward>)
output :  tensor([[120785.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(4903283.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175620.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1903925.6250, grad_fn=<MseLossBackward>)
output :  tensor([[178789.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5951e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201557.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7272e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133400.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1064701.5000, grad_fn=<MseLossBackward>)
output :  tensor([[149625.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8540e+08, grad_fn=<MseLossBackward>)
output :  tensor([[274678.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5390813.5000, grad_fn=<MseLossBackward>)
output :  tensor([[90731.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(32848390., grad_fn=<MseLossBackward>)
output :  tensor([[236974.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(225224.3906, grad_fn=<MseLossBackward>)
output :  tensor([[256861.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0632e+11, grad_fn=<MseLossBackward>)
output :  tensor([[169919.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6422.5195, grad_fn=<MseLossBackward>)
output :  tensor([[193022.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7621e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153459.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2373381., grad_fn=<MseLossBackward>)
output :  tensor([[204940.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2328e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127238.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3101231., grad_fn=<MseLossBackward>)
output :  tensor([[155070.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0141e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169704.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4010e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183053.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7818053., grad_fn=<MseLossBackward>)
output :  tensor([[124278.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(2961868., grad_fn=<MseLossBackward>)
output :  tensor([[138902.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5774183.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177984.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(24850070., grad_fn=<MseLossBackward>)
output :  tensor([[197215.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7862e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239790.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(10300389., grad_fn=<MseLossBackward>)
output :  tensor([[153619.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1905176.3750, grad_fn=<MseLossBackward>)
output :  tensor([[195847.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(23156.2793, grad_fn=<MseLossBackward>)
output :  tensor([[163294.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7226e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196026.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7314e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179746.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(23648.6719, grad_fn=<MseLossBackward>)
output :  tensor([[97200.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(40003.1250, grad_fn=<MseLossBackward>)
output :  tensor([[173701.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1299e+10, grad_fn=<MseLossBackward>)
output :  tensor([[137277.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5188714.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123211.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(67428216., grad_fn=<MseLossBackward>)
output :  tensor([[173633.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(134574.3438, grad_fn=<MseLossBackward>)
output :  tensor([[87937.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(8629090., grad_fn=<MseLossBackward>)
output :  tensor([[289795.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(41948.1602, grad_fn=<MseLossBackward>)
output :  tensor([[168703.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(13718806., grad_fn=<MseLossBackward>)
output :  tensor([[191935.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9947e+10, grad_fn=<MseLossBackward>)
output :  tensor([[241052.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9686e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155555.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(20749734., grad_fn=<MseLossBackward>)
output :  tensor([[123564.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(189496.9688, grad_fn=<MseLossBackward>)
output :  tensor([[121219.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(1741925.6250, grad_fn=<MseLossBackward>)
output :  tensor([[147914.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0833e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176311.]], grad_fn=<AddmmBackward>)
loss:  tensor(5340721., grad_fn=<MseLossBackward>)
output :  tensor([[113558.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6465e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206347.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2466e+10, grad_fn=<MseLossBackward>)
output :  tensor([[234347.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(51157140., grad_fn=<MseLossBackward>)
output :  tensor([[250587.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0911e+10, grad_fn=<MseLossBackward>)
output :  tensor([[219411.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8371e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194358.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4675e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190035.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6427651., grad_fn=<MseLossBackward>)
output :  tensor([[207838.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7103e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187988.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1907e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179441.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(491883.0625, grad_fn=<MseLossBackward>)
output :  tensor([[151711.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(83412.6562, grad_fn=<MseLossBackward>)
output :  tensor([[328394.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(74062696., grad_fn=<MseLossBackward>)
output :  tensor([[209012.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8926837., grad_fn=<MseLossBackward>)
output :  tensor([[156397.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(12978682., grad_fn=<MseLossBackward>)
output :  tensor([[184445.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2552e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109112.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(16915806., grad_fn=<MseLossBackward>)
output :  tensor([[268970.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1813e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170568.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(11100558., grad_fn=<MseLossBackward>)
output :  tensor([[218237.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(22447756., grad_fn=<MseLossBackward>)
output :  tensor([[206681.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0502e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182017.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(7939363., grad_fn=<MseLossBackward>)
output :  tensor([[207376.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(31094738., grad_fn=<MseLossBackward>)
output :  tensor([[157601.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6766257.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150593.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5597e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118369.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(17007.8281, grad_fn=<MseLossBackward>)
output :  tensor([[143215.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(10337833., grad_fn=<MseLossBackward>)
output :  tensor([[146685.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5354957.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200797.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6181e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160515.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1030510.5000, grad_fn=<MseLossBackward>)
output :  tensor([[99519.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(384.2213, grad_fn=<MseLossBackward>)
output :  tensor([[227532.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5544e+08, grad_fn=<MseLossBackward>)
output :  tensor([[189040.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5416e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175140.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1807596.2500, grad_fn=<MseLossBackward>)
output :  tensor([[84007.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4030432.7500, grad_fn=<MseLossBackward>)
output :  tensor([[129694.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(1426998.2500, grad_fn=<MseLossBackward>)
output :  tensor([[213132.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(751905.7500, grad_fn=<MseLossBackward>)
output :  tensor([[143548.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(204134.5312, grad_fn=<MseLossBackward>)
output :  tensor([[128532.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2152547.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147414.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(23176250., grad_fn=<MseLossBackward>)
output :  tensor([[177907.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6327e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148080.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(16653796., grad_fn=<MseLossBackward>)
output :  tensor([[160990.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(982050.0625, grad_fn=<MseLossBackward>)
output :  tensor([[215746.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(556632.5625, grad_fn=<MseLossBackward>)
output :  tensor([[139305.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1769e+09, grad_fn=<MseLossBackward>)
output :  tensor([[256675.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2807457.2500, grad_fn=<MseLossBackward>)
output :  tensor([[159348.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(22956.9844, grad_fn=<MseLossBackward>)
output :  tensor([[131120.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6864727.5000, grad_fn=<MseLossBackward>)
output :  tensor([[94367.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(399779.5938, grad_fn=<MseLossBackward>)
output :  tensor([[156224.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1444e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179579.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(102750.2969, grad_fn=<MseLossBackward>)
output :  tensor([[122627.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4526522., grad_fn=<MseLossBackward>)
output :  tensor([[187466.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7209e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144802.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2645e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147870.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4120519.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186904.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(714183.4375, grad_fn=<MseLossBackward>)
output :  tensor([[253155.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5937e+09, grad_fn=<MseLossBackward>)
output :  tensor([[89793.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(2911049.2500, grad_fn=<MseLossBackward>)
output :  tensor([[239479.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(271001.5938, grad_fn=<MseLossBackward>)
output :  tensor([[129727.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1506142.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165131.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0154e+10, grad_fn=<MseLossBackward>)
output :  tensor([[115710.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4683e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175401.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(358557.6875, grad_fn=<MseLossBackward>)
output :  tensor([[165724.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9298e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158508.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8445e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235895.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(9639181., grad_fn=<MseLossBackward>)
output :  tensor([[226369.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0005e+09, grad_fn=<MseLossBackward>)
output :  tensor([[125263.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3014401.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123655.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5494922., grad_fn=<MseLossBackward>)
output :  tensor([[222896.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(16838072., grad_fn=<MseLossBackward>)
output :  tensor([[230463.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(12503628., grad_fn=<MseLossBackward>)
output :  tensor([[226213.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(236287.1406, grad_fn=<MseLossBackward>)
output :  tensor([[147059.]], grad_fn=<AddmmBackward>)
loss:  tensor(885481., grad_fn=<MseLossBackward>)
output :  tensor([[206712.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(10807554., grad_fn=<MseLossBackward>)
output :  tensor([[134973.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2419e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137970.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(29923976., grad_fn=<MseLossBackward>)
output :  tensor([[308319.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(44628244., grad_fn=<MseLossBackward>)
output :  tensor([[143670.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7133573.5000, grad_fn=<MseLossBackward>)
output :  tensor([[119658.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7729e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107947.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2410207.7500, grad_fn=<MseLossBackward>)
output :  tensor([[155133.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0159e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178389.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2805e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174247.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1555398.7500, grad_fn=<MseLossBackward>)
output :  tensor([[193400.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(57754536., grad_fn=<MseLossBackward>)
output :  tensor([[102936.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8625418., grad_fn=<MseLossBackward>)
output :  tensor([[180423.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2025462.6250, grad_fn=<MseLossBackward>)
output :  tensor([[167424.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(225951.6875, grad_fn=<MseLossBackward>)
output :  tensor([[142608.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(13020032., grad_fn=<MseLossBackward>)
output :  tensor([[263256.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1860e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142669.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3257e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176001.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(9008439., grad_fn=<MseLossBackward>)
output :  tensor([[141412.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1995995., grad_fn=<MseLossBackward>)
output :  tensor([[203380.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8296380., grad_fn=<MseLossBackward>)
output :  tensor([[171284.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1649498.7500, grad_fn=<MseLossBackward>)
output :  tensor([[242101.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3606082.2500, grad_fn=<MseLossBackward>)
output :  tensor([[133949.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(302568.7500, grad_fn=<MseLossBackward>)
output :  tensor([[152192.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8080872., grad_fn=<MseLossBackward>)
output :  tensor([[214088.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(831117.1250, grad_fn=<MseLossBackward>)
output :  tensor([[166109.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1230192.8750, grad_fn=<MseLossBackward>)
output :  tensor([[193351.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(18937864., grad_fn=<MseLossBackward>)
output :  tensor([[135065.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7284e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129977.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(956071.4375, grad_fn=<MseLossBackward>)
output :  tensor([[141611.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2597838.7500, grad_fn=<MseLossBackward>)
output :  tensor([[198571.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0309e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165572.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5575e+09, grad_fn=<MseLossBackward>)
output :  tensor([[78185.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3070e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96120.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3504e+08, grad_fn=<MseLossBackward>)
output :  tensor([[259902.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(43681980., grad_fn=<MseLossBackward>)
output :  tensor([[203253.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1286e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117453.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(6021004., grad_fn=<MseLossBackward>)
output :  tensor([[159683.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7374e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206137.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9217e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179948.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1093e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158122.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9751568., grad_fn=<MseLossBackward>)
output :  tensor([[168476.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2319624.2500, grad_fn=<MseLossBackward>)
output :  tensor([[116197.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1433370.1250, grad_fn=<MseLossBackward>)
output :  tensor([[165069.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0140e+08, grad_fn=<MseLossBackward>)
output :  tensor([[193258.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8609e+08, grad_fn=<MseLossBackward>)
output :  tensor([[218272.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1507024.7500, grad_fn=<MseLossBackward>)
output :  tensor([[244732.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5027e+11, grad_fn=<MseLossBackward>)
output :  tensor([[148564.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2446438.2500, grad_fn=<MseLossBackward>)
output :  tensor([[111473.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8959265., grad_fn=<MseLossBackward>)
output :  tensor([[171866.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0066e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148633.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3482189.2500, grad_fn=<MseLossBackward>)
output :  tensor([[232551.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(19791516., grad_fn=<MseLossBackward>)
output :  tensor([[117372.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(5628348.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182818.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6675.4004, grad_fn=<MseLossBackward>)
output :  tensor([[188415.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2941707.2500, grad_fn=<MseLossBackward>)
output :  tensor([[163550.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4476e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97457.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7086e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237096.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3624561.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178108.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4444059.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138179.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3314391., grad_fn=<MseLossBackward>)
output :  tensor([[235060.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3707.6682, grad_fn=<MseLossBackward>)
output :  tensor([[163449.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(202190.7500, grad_fn=<MseLossBackward>)
output :  tensor([[201846.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5167e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133066.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3739510., grad_fn=<MseLossBackward>)
output :  tensor([[185840.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6835e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135812.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(35138.6758, grad_fn=<MseLossBackward>)
output :  tensor([[225930.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0139e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223329.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1134e+08, grad_fn=<MseLossBackward>)
output :  tensor([[88750.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1562304.7500, grad_fn=<MseLossBackward>)
output :  tensor([[158992.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(194549.9062, grad_fn=<MseLossBackward>)
output :  tensor([[245422.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5739e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145658.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(434095.6875, grad_fn=<MseLossBackward>)
output :  tensor([[112041.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0287e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166355.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3443982., grad_fn=<MseLossBackward>)
output :  tensor([[138349.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(31926384., grad_fn=<MseLossBackward>)
output :  tensor([[129410.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(1466350.7500, grad_fn=<MseLossBackward>)
output :  tensor([[191066.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6149e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123111.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(373722.0625, grad_fn=<MseLossBackward>)
output :  tensor([[150065.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3742894.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169687.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4254551., grad_fn=<MseLossBackward>)
output :  tensor([[149037.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3851958.2500, grad_fn=<MseLossBackward>)
output :  tensor([[161316.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2506037.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135600.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0759e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131071.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(862547.5625, grad_fn=<MseLossBackward>)
output :  tensor([[157012.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2446e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145446.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1674557.3750, grad_fn=<MseLossBackward>)
output :  tensor([[163697.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3793486.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144031.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1650e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151571.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7682771.5000, grad_fn=<MseLossBackward>)
output :  tensor([[187006.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(987849.6250, grad_fn=<MseLossBackward>)
output :  tensor([[168338.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(437168.9062, grad_fn=<MseLossBackward>)
output :  tensor([[180341.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(116878.5156, grad_fn=<MseLossBackward>)
output :  tensor([[219608.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(153492.5469, grad_fn=<MseLossBackward>)
output :  tensor([[111530.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(13181041., grad_fn=<MseLossBackward>)
output :  tensor([[140450.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4181e+08, grad_fn=<MseLossBackward>)
output :  tensor([[283088.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(8474103., grad_fn=<MseLossBackward>)
output :  tensor([[120489.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(20154698., grad_fn=<MseLossBackward>)
output :  tensor([[176080.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9289e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184442.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(311172.2188, grad_fn=<MseLossBackward>)
output :  tensor([[188295.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7817179., grad_fn=<MseLossBackward>)
output :  tensor([[253408.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6621e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221159.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(706702.9375, grad_fn=<MseLossBackward>)
output :  tensor([[131736.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6750e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177493.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9995e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125052.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1108644.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182803.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5524e+10, grad_fn=<MseLossBackward>)
output :  tensor([[155223.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4945898., grad_fn=<MseLossBackward>)
output :  tensor([[155927.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(88879816., grad_fn=<MseLossBackward>)
output :  tensor([[204863.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2064295.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145505.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6914e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177310.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1718352.2500, grad_fn=<MseLossBackward>)
output :  tensor([[247633.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0154e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148305.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(93301.6094, grad_fn=<MseLossBackward>)
output :  tensor([[203087.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(178889.3438, grad_fn=<MseLossBackward>)
output :  tensor([[161866.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3673930.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127437.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5553e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138568.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7942885.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183269.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(533698.7500, grad_fn=<MseLossBackward>)
output :  tensor([[194907.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(24083402., grad_fn=<MseLossBackward>)
output :  tensor([[215853.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3504e+09, grad_fn=<MseLossBackward>)
output :  tensor([[253809.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(10179988., grad_fn=<MseLossBackward>)
output :  tensor([[182851.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8537e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144191.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7764e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142849.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2725182., grad_fn=<MseLossBackward>)
output :  tensor([[75688.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2737e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137456.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(6036618.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129493.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(352539.0625, grad_fn=<MseLossBackward>)
output :  tensor([[156016.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4066776.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130214.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(10335120., grad_fn=<MseLossBackward>)
output :  tensor([[77260.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(577718.7500, grad_fn=<MseLossBackward>)
output :  tensor([[82858.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(737143., grad_fn=<MseLossBackward>)
output :  tensor([[240288.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(68705704., grad_fn=<MseLossBackward>)
output :  tensor([[141222.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2497e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129381.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(1250046.2500, grad_fn=<MseLossBackward>)
output :  tensor([[168775.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3153732., grad_fn=<MseLossBackward>)
output :  tensor([[231108.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(15146326., grad_fn=<MseLossBackward>)
output :  tensor([[186717.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(29400964., grad_fn=<MseLossBackward>)
output :  tensor([[155159.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(705888.7500, grad_fn=<MseLossBackward>)
output :  tensor([[200909.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(9059818., grad_fn=<MseLossBackward>)
output :  tensor([[198464.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4850e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137957.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(915968.6250, grad_fn=<MseLossBackward>)
output :  tensor([[155934.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(873377.8750, grad_fn=<MseLossBackward>)
output :  tensor([[136922.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(851092.7500, grad_fn=<MseLossBackward>)
output :  tensor([[195884.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1639e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154814.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(662697.7500, grad_fn=<MseLossBackward>)
output :  tensor([[140028.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1649e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145142.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(59033.8125, grad_fn=<MseLossBackward>)
output :  tensor([[211950.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2457.9905, grad_fn=<MseLossBackward>)
output :  tensor([[105632.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5850e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166161.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1792628.1250, grad_fn=<MseLossBackward>)
output :  tensor([[127154.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(714513.6250, grad_fn=<MseLossBackward>)
output :  tensor([[145026.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3894640.5000, grad_fn=<MseLossBackward>)
output :  tensor([[107268.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0147e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141944.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(19755246., grad_fn=<MseLossBackward>)
output :  tensor([[236239.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(57307.8711, grad_fn=<MseLossBackward>)
output :  tensor([[144237.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(581453.9375, grad_fn=<MseLossBackward>)
output :  tensor([[139065.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2450350., grad_fn=<MseLossBackward>)
output :  tensor([[164241.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3134e+09, grad_fn=<MseLossBackward>)
output :  tensor([[263444.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1186e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174773.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(51160.7852, grad_fn=<MseLossBackward>)
output :  tensor([[105922.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(9901937., grad_fn=<MseLossBackward>)
output :  tensor([[198770.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1983e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159750.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(562734.3750, grad_fn=<MseLossBackward>)
output :  tensor([[159678.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7414e+10, grad_fn=<MseLossBackward>)
output :  tensor([[99440.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(1300366., grad_fn=<MseLossBackward>)
output :  tensor([[123701.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(10367.3760, grad_fn=<MseLossBackward>)
output :  tensor([[155801.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(39228.7539, grad_fn=<MseLossBackward>)
output :  tensor([[138705.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1674516.8750, grad_fn=<MseLossBackward>)
output :  tensor([[200343.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(118185.5469, grad_fn=<MseLossBackward>)
output :  tensor([[142466.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(217651.4062, grad_fn=<MseLossBackward>)
output :  tensor([[264122.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3395842.7500, grad_fn=<MseLossBackward>)
output :  tensor([[126663.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1332e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164490.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1019216.4375, grad_fn=<MseLossBackward>)
output :  tensor([[187689.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(656150.6250, grad_fn=<MseLossBackward>)
output :  tensor([[124459.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0908e+08, grad_fn=<MseLossBackward>)
output :  tensor([[245319.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(21905764., grad_fn=<MseLossBackward>)
output :  tensor([[155905.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6689e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243735.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2606559.7500, grad_fn=<MseLossBackward>)
output :  tensor([[141833.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4694399.5000, grad_fn=<MseLossBackward>)
output :  tensor([[210239.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(57210.6602, grad_fn=<MseLossBackward>)
output :  tensor([[175166.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(7651620.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153017.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(965429.0625, grad_fn=<MseLossBackward>)
output :  tensor([[115910.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4364378., grad_fn=<MseLossBackward>)
output :  tensor([[236945.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5145e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237922.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4316266., grad_fn=<MseLossBackward>)
output :  tensor([[151103.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4989429.5000, grad_fn=<MseLossBackward>)
output :  tensor([[254309.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(348874.8125, grad_fn=<MseLossBackward>)
output :  tensor([[121810.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(53382660., grad_fn=<MseLossBackward>)
output :  tensor([[178794.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(7809143., grad_fn=<MseLossBackward>)
output :  tensor([[163621.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(13117865., grad_fn=<MseLossBackward>)
output :  tensor([[137237.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(38901728., grad_fn=<MseLossBackward>)
output :  tensor([[197412.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6121e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164032.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1086.9385, grad_fn=<MseLossBackward>)
output :  tensor([[165261.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(5112898., grad_fn=<MseLossBackward>)
output :  tensor([[157567.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(187164.3906, grad_fn=<MseLossBackward>)
output :  tensor([[146348.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(12614262., grad_fn=<MseLossBackward>)
output :  tensor([[175006.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2911e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160154.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(23870.2500, grad_fn=<MseLossBackward>)
output :  tensor([[371816.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4772e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123062.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(15500892., grad_fn=<MseLossBackward>)
output :  tensor([[129796.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9622e+09, grad_fn=<MseLossBackward>)
output :  tensor([[278643.]], grad_fn=<AddmmBackward>)
loss:  tensor(6604900., grad_fn=<MseLossBackward>)
output :  tensor([[161769.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(53000.6719, grad_fn=<MseLossBackward>)
output :  tensor([[135410.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2232e+08, grad_fn=<MseLossBackward>)
output :  tensor([[228183.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(14567819., grad_fn=<MseLossBackward>)
output :  tensor([[181125.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(390664.0625, grad_fn=<MseLossBackward>)
output :  tensor([[153932.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3736066.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145166.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(27779.5137, grad_fn=<MseLossBackward>)
output :  tensor([[155511.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4639e+08, grad_fn=<MseLossBackward>)
output :  tensor([[102151.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4628280., grad_fn=<MseLossBackward>)
output :  tensor([[81340.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5542e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164204.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(632571.6875, grad_fn=<MseLossBackward>)
output :  tensor([[187106.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6723e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159301.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1693373.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165781.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(68586864., grad_fn=<MseLossBackward>)
output :  tensor([[139016.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2454705.5000, grad_fn=<MseLossBackward>)
output :  tensor([[201889.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(16488802., grad_fn=<MseLossBackward>)
output :  tensor([[139132.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1281494.7500, grad_fn=<MseLossBackward>)
output :  tensor([[182810.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6177e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146271.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(73873.5391, grad_fn=<MseLossBackward>)
output :  tensor([[109714.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1367e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92883.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(1246729.2500, grad_fn=<MseLossBackward>)
output :  tensor([[174657.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(116974.6875, grad_fn=<MseLossBackward>)
output :  tensor([[259976.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(179444.9062, grad_fn=<MseLossBackward>)
output :  tensor([[144128.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6908108.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158945.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(901965.6875, grad_fn=<MseLossBackward>)
output :  tensor([[134587.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4359287.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147209.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5246175.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170584.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(7205869., grad_fn=<MseLossBackward>)
output :  tensor([[129634.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6940261., grad_fn=<MseLossBackward>)
output :  tensor([[174753.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8530e+08, grad_fn=<MseLossBackward>)
output :  tensor([[159315.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5359369.5000, grad_fn=<MseLossBackward>)
output :  tensor([[116247.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(63637.9453, grad_fn=<MseLossBackward>)
output :  tensor([[161504.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1116e+09, grad_fn=<MseLossBackward>)
output :  tensor([[52460.2930]], grad_fn=<AddmmBackward>)
loss:  tensor(211869.6094, grad_fn=<MseLossBackward>)
output :  tensor([[232835.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3464e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201615.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(379186.5625, grad_fn=<MseLossBackward>)
output :  tensor([[187442.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5966493., grad_fn=<MseLossBackward>)
output :  tensor([[107601.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(2563376., grad_fn=<MseLossBackward>)
output :  tensor([[92342.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(28539802., grad_fn=<MseLossBackward>)
output :  tensor([[138409.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2530038.2500, grad_fn=<MseLossBackward>)
output :  tensor([[219193.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5960e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201483.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(36194888., grad_fn=<MseLossBackward>)
output :  tensor([[165802.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(643504.8125, grad_fn=<MseLossBackward>)
output :  tensor([[173081.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4490e+09, grad_fn=<MseLossBackward>)
output :  tensor([[188326.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2799765.5000, grad_fn=<MseLossBackward>)
output :  tensor([[86136.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(744836.4375, grad_fn=<MseLossBackward>)
output :  tensor([[134745.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(27609114., grad_fn=<MseLossBackward>)
output :  tensor([[111271.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(595188.1250, grad_fn=<MseLossBackward>)
output :  tensor([[149275.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7730e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172263.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7026e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194909.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0182e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178913.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1180414.3750, grad_fn=<MseLossBackward>)
output :  tensor([[100461.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(15692616., grad_fn=<MseLossBackward>)
output :  tensor([[117014.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(235270.4688, grad_fn=<MseLossBackward>)
output :  tensor([[158660.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4208e+08, grad_fn=<MseLossBackward>)
output :  tensor([[200485.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(235892.3438, grad_fn=<MseLossBackward>)
output :  tensor([[145815.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3296097., grad_fn=<MseLossBackward>)
train_loss: [2.6573169e+09]
epoch_result tensor([0.])
output :  tensor([[155404.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(9583184., grad_fn=<MseLossBackward>)
output :  tensor([[124695.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(7263699., grad_fn=<MseLossBackward>)
output :  tensor([[194784.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(340071.2188, grad_fn=<MseLossBackward>)
output :  tensor([[178729.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2992359.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154579.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4854e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131958.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(15666506., grad_fn=<MseLossBackward>)
output :  tensor([[141733.]], grad_fn=<AddmmBackward>)
loss:  tensor(537289., grad_fn=<MseLossBackward>)
output :  tensor([[117872.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(1270181.8750, grad_fn=<MseLossBackward>)
output :  tensor([[67818.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(86839392., grad_fn=<MseLossBackward>)
output :  tensor([[165279.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(519660.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153892.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9299e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223514.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2206896., grad_fn=<MseLossBackward>)
output :  tensor([[167651.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1818494.3750, grad_fn=<MseLossBackward>)
output :  tensor([[251847.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4612024.5000, grad_fn=<MseLossBackward>)
output :  tensor([[53415.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2509848., grad_fn=<MseLossBackward>)
output :  tensor([[164543.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0175e+08, grad_fn=<MseLossBackward>)
output :  tensor([[170666.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(18775024., grad_fn=<MseLossBackward>)
output :  tensor([[156275.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(50190., grad_fn=<MseLossBackward>)
output :  tensor([[272897.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4419980.5000, grad_fn=<MseLossBackward>)
output :  tensor([[195286.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2935065., grad_fn=<MseLossBackward>)
output :  tensor([[137569.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5587e+10, grad_fn=<MseLossBackward>)
output :  tensor([[197069.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(10177994., grad_fn=<MseLossBackward>)
output :  tensor([[178223.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1787e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154233.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(10455825., grad_fn=<MseLossBackward>)
output :  tensor([[171636.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2678848.2500, grad_fn=<MseLossBackward>)
output :  tensor([[88093.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(7255657.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168761.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1093e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185065.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4247.3730, grad_fn=<MseLossBackward>)
output :  tensor([[205087.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5414e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111888.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(3566107.7500, grad_fn=<MseLossBackward>)
output :  tensor([[172669.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2787021.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142746.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(39017592., grad_fn=<MseLossBackward>)
output :  tensor([[131317.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5369937., grad_fn=<MseLossBackward>)
output :  tensor([[120437.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(878364.3125, grad_fn=<MseLossBackward>)
output :  tensor([[148479.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9094e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171366.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0631e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151028.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1766158., grad_fn=<MseLossBackward>)
output :  tensor([[181236.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1529743.7500, grad_fn=<MseLossBackward>)
output :  tensor([[143619.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6863663., grad_fn=<MseLossBackward>)
output :  tensor([[108238.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3264e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137131.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0636e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133073.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3712967.7500, grad_fn=<MseLossBackward>)
output :  tensor([[131707.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(22160114., grad_fn=<MseLossBackward>)
output :  tensor([[226589.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2526709., grad_fn=<MseLossBackward>)
output :  tensor([[132548.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(89158.2266, grad_fn=<MseLossBackward>)
output :  tensor([[149054.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3007.8369, grad_fn=<MseLossBackward>)
output :  tensor([[116770.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(22757596., grad_fn=<MseLossBackward>)
output :  tensor([[160931.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(867750.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146888.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3147e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192727.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(528869.8125, grad_fn=<MseLossBackward>)
output :  tensor([[136062.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2600861.7500, grad_fn=<MseLossBackward>)
output :  tensor([[105113.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(23875592., grad_fn=<MseLossBackward>)
output :  tensor([[233295.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(496276.2188, grad_fn=<MseLossBackward>)
output :  tensor([[164748.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3757e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165755.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(45631292., grad_fn=<MseLossBackward>)
output :  tensor([[203674.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8502e+10, grad_fn=<MseLossBackward>)
output :  tensor([[240667.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2844e+10, grad_fn=<MseLossBackward>)
output :  tensor([[140848.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7028215., grad_fn=<MseLossBackward>)
output :  tensor([[133157.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(710464.6250, grad_fn=<MseLossBackward>)
output :  tensor([[153262.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3017386.2500, grad_fn=<MseLossBackward>)
output :  tensor([[130203.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(41358.2148, grad_fn=<MseLossBackward>)
output :  tensor([[182269.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0421e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182069.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4124834., grad_fn=<MseLossBackward>)
output :  tensor([[163361.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3466578.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142158.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(708043.3750, grad_fn=<MseLossBackward>)
output :  tensor([[143343.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(711940.4375, grad_fn=<MseLossBackward>)
output :  tensor([[145120.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(14535.3164, grad_fn=<MseLossBackward>)
output :  tensor([[170579.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7757e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194150.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2210e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136303.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(38685.9727, grad_fn=<MseLossBackward>)
output :  tensor([[172765.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(749496., grad_fn=<MseLossBackward>)
output :  tensor([[177515.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(12144898., grad_fn=<MseLossBackward>)
output :  tensor([[116629.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(2655754., grad_fn=<MseLossBackward>)
output :  tensor([[220420.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(335602.9688, grad_fn=<MseLossBackward>)
output :  tensor([[183511.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(129.0354, grad_fn=<MseLossBackward>)
output :  tensor([[126346.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(716535.8125, grad_fn=<MseLossBackward>)
output :  tensor([[199386.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8330439., grad_fn=<MseLossBackward>)
output :  tensor([[173326.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2476197.2500, grad_fn=<MseLossBackward>)
output :  tensor([[204812.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2919e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209992.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1015402.6250, grad_fn=<MseLossBackward>)
output :  tensor([[170150.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5327e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193603.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(803796.3125, grad_fn=<MseLossBackward>)
output :  tensor([[114166.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1360467.1250, grad_fn=<MseLossBackward>)
output :  tensor([[116017.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(12369344., grad_fn=<MseLossBackward>)
output :  tensor([[110910.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(1188083., grad_fn=<MseLossBackward>)
output :  tensor([[148415.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2608982., grad_fn=<MseLossBackward>)
output :  tensor([[157553.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4258e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177066.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(8603681., grad_fn=<MseLossBackward>)
output :  tensor([[125556.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3776645.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147304.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5309928., grad_fn=<MseLossBackward>)
output :  tensor([[183363.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3487e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117213.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(98003.2344, grad_fn=<MseLossBackward>)
output :  tensor([[194254.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7538885.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145860.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(740756.0625, grad_fn=<MseLossBackward>)
output :  tensor([[207045.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(34272244., grad_fn=<MseLossBackward>)
output :  tensor([[125882.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(13900.0420, grad_fn=<MseLossBackward>)
output :  tensor([[243017.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(28199584., grad_fn=<MseLossBackward>)
output :  tensor([[236836.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3197e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148290.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8529e+08, grad_fn=<MseLossBackward>)
output :  tensor([[83761.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1810e+08, grad_fn=<MseLossBackward>)
output :  tensor([[190236.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1679e+09, grad_fn=<MseLossBackward>)
output :  tensor([[79574.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(2031805.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140050.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(303360., grad_fn=<MseLossBackward>)
output :  tensor([[77609.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4449001.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144702.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3060805., grad_fn=<MseLossBackward>)
output :  tensor([[177429.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2043023.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153592.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(8538.9150, grad_fn=<MseLossBackward>)
output :  tensor([[110470.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(9430993., grad_fn=<MseLossBackward>)
output :  tensor([[200244.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3342e+10, grad_fn=<MseLossBackward>)
output :  tensor([[130471.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3886196.2500, grad_fn=<MseLossBackward>)
output :  tensor([[264534.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3919e+08, grad_fn=<MseLossBackward>)
output :  tensor([[305242.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(22631724., grad_fn=<MseLossBackward>)
output :  tensor([[109274.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(3150486.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170820.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2820772.7500, grad_fn=<MseLossBackward>)
output :  tensor([[133279.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3904e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129486.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(90513368., grad_fn=<MseLossBackward>)
output :  tensor([[130538.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(83457.7969, grad_fn=<MseLossBackward>)
output :  tensor([[128766.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(14186758., grad_fn=<MseLossBackward>)
output :  tensor([[135932.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9865e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227776.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8112e+10, grad_fn=<MseLossBackward>)
output :  tensor([[185158.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4287e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143925.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(657.4417, grad_fn=<MseLossBackward>)
output :  tensor([[131374.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(15011871., grad_fn=<MseLossBackward>)
output :  tensor([[111383.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(17824.3359, grad_fn=<MseLossBackward>)
output :  tensor([[253147.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2137e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133306.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2867942.2500, grad_fn=<MseLossBackward>)
output :  tensor([[201936.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1131132., grad_fn=<MseLossBackward>)
output :  tensor([[102563.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(5458319.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138673.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1628255.7500, grad_fn=<MseLossBackward>)
output :  tensor([[204091.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1650e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173936.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(35564076., grad_fn=<MseLossBackward>)
output :  tensor([[187546.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(6486970., grad_fn=<MseLossBackward>)
output :  tensor([[164180.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0973e+10, grad_fn=<MseLossBackward>)
output :  tensor([[297121.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4348e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197869.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(926.4414, grad_fn=<MseLossBackward>)
output :  tensor([[260121.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0375e+10, grad_fn=<MseLossBackward>)
output :  tensor([[217200.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3814e+09, grad_fn=<MseLossBackward>)
output :  tensor([[278875.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4535e+09, grad_fn=<MseLossBackward>)
output :  tensor([[223611.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(151102.2656, grad_fn=<MseLossBackward>)
output :  tensor([[219590.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9725e+10, grad_fn=<MseLossBackward>)
output :  tensor([[203582.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(43334860., grad_fn=<MseLossBackward>)
output :  tensor([[158728.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8377e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133644.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1309379.6250, grad_fn=<MseLossBackward>)
output :  tensor([[134692.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(652611.5000, grad_fn=<MseLossBackward>)
output :  tensor([[89742.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1581345.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110713.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(7361005., grad_fn=<MseLossBackward>)
output :  tensor([[273090.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1147e+09, grad_fn=<MseLossBackward>)
output :  tensor([[233591.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1984752.6250, grad_fn=<MseLossBackward>)
output :  tensor([[146695.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2873819.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139691.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4801371., grad_fn=<MseLossBackward>)
output :  tensor([[175191.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2126265.2500, grad_fn=<MseLossBackward>)
output :  tensor([[151340.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(37089432., grad_fn=<MseLossBackward>)
output :  tensor([[163136.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8365e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165658.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(433272.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135204.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3222529.7500, grad_fn=<MseLossBackward>)
output :  tensor([[190686.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6494e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114042.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4170593.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165881.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(37431644., grad_fn=<MseLossBackward>)
output :  tensor([[122032.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4132072.5000, grad_fn=<MseLossBackward>)
output :  tensor([[87415.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(172237.9688, grad_fn=<MseLossBackward>)
output :  tensor([[178147.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3433261.5000, grad_fn=<MseLossBackward>)
output :  tensor([[111248.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(1819021.2500, grad_fn=<MseLossBackward>)
output :  tensor([[239914.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(835824.5000, grad_fn=<MseLossBackward>)
output :  tensor([[248028.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9172096., grad_fn=<MseLossBackward>)
output :  tensor([[124126.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(28870304., grad_fn=<MseLossBackward>)
output :  tensor([[106727.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(4981022., grad_fn=<MseLossBackward>)
output :  tensor([[284823.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3205e+10, grad_fn=<MseLossBackward>)
output :  tensor([[168615.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(8319078.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125798.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(637003.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143310.]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4060e+08, grad_fn=<MseLossBackward>)
output :  tensor([[200770.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7503e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140675.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(105229.2812, grad_fn=<MseLossBackward>)
output :  tensor([[153420.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6022e+10, grad_fn=<MseLossBackward>)
output :  tensor([[155807.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3639152.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129019.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(231255.7969, grad_fn=<MseLossBackward>)
output :  tensor([[242245.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8565e+10, grad_fn=<MseLossBackward>)
output :  tensor([[397398.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(21176104., grad_fn=<MseLossBackward>)
output :  tensor([[110756.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3083700.7500, grad_fn=<MseLossBackward>)
output :  tensor([[119479.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(958884.6875, grad_fn=<MseLossBackward>)
output :  tensor([[160352.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(726516.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132690.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5410e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161267.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6884e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175104.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2386e+09, grad_fn=<MseLossBackward>)
output :  tensor([[102352.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1555164.8750, grad_fn=<MseLossBackward>)
output :  tensor([[138275.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(7423581.5000, grad_fn=<MseLossBackward>)
output :  tensor([[365418.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3517031.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198995.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0255e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176545.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1092841.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194766.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(66152552., grad_fn=<MseLossBackward>)
output :  tensor([[136992.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4031122.7500, grad_fn=<MseLossBackward>)
output :  tensor([[193415.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1176818.1250, grad_fn=<MseLossBackward>)
output :  tensor([[136173.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2217e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176677.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(18686032., grad_fn=<MseLossBackward>)
output :  tensor([[242026.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(723.9463, grad_fn=<MseLossBackward>)
output :  tensor([[176886.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8329717.5000, grad_fn=<MseLossBackward>)
output :  tensor([[111212.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(10320759., grad_fn=<MseLossBackward>)
output :  tensor([[263636.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(854180.3125, grad_fn=<MseLossBackward>)
output :  tensor([[248246.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3075803.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123107.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(11657.2510, grad_fn=<MseLossBackward>)
output :  tensor([[211701.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0067e+09, grad_fn=<MseLossBackward>)
output :  tensor([[303397.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7971e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206939.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3692.4612, grad_fn=<MseLossBackward>)
output :  tensor([[213458.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6013e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161153.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(10583636., grad_fn=<MseLossBackward>)
output :  tensor([[169895.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8974.6016, grad_fn=<MseLossBackward>)
output :  tensor([[158395.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2141832.2500, grad_fn=<MseLossBackward>)
output :  tensor([[171833.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3362238., grad_fn=<MseLossBackward>)
output :  tensor([[235977.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0254e+09, grad_fn=<MseLossBackward>)
output :  tensor([[211030.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3951e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161613.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1357e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124904.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(3626793., grad_fn=<MseLossBackward>)
output :  tensor([[176140.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(738632.8125, grad_fn=<MseLossBackward>)
output :  tensor([[176690.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9405e+09, grad_fn=<MseLossBackward>)
output :  tensor([[204476.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6153e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134999.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(322286.8438, grad_fn=<MseLossBackward>)
output :  tensor([[153082.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9113e+08, grad_fn=<MseLossBackward>)
output :  tensor([[280480.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(12110618., grad_fn=<MseLossBackward>)
output :  tensor([[88579.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(12813435., grad_fn=<MseLossBackward>)
output :  tensor([[232393.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(16861546., grad_fn=<MseLossBackward>)
output :  tensor([[256864.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0632e+11, grad_fn=<MseLossBackward>)
output :  tensor([[171312.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1721672., grad_fn=<MseLossBackward>)
output :  tensor([[191768.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8690e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152426.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6623706.5000, grad_fn=<MseLossBackward>)
output :  tensor([[206009.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0948e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129390.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(152624.5156, grad_fn=<MseLossBackward>)
output :  tensor([[148660.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(13398231., grad_fn=<MseLossBackward>)
output :  tensor([[168070.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5383e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184539.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1716632.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128865.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8211538., grad_fn=<MseLossBackward>)
output :  tensor([[137471.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(944753.6250, grad_fn=<MseLossBackward>)
output :  tensor([[174294.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1676539.3750, grad_fn=<MseLossBackward>)
output :  tensor([[196722.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8385e+09, grad_fn=<MseLossBackward>)
output :  tensor([[241062.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3754632.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153224.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3151512.5000, grad_fn=<MseLossBackward>)
output :  tensor([[199454.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(11932383., grad_fn=<MseLossBackward>)
output :  tensor([[161972.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2300e+08, grad_fn=<MseLossBackward>)
output :  tensor([[191137.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3542e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178830.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1144264.7500, grad_fn=<MseLossBackward>)
output :  tensor([[96639.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(129796.9531, grad_fn=<MseLossBackward>)
output :  tensor([[173281.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1389e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132459.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6456522., grad_fn=<MseLossBackward>)
output :  tensor([[120946.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(35365600., grad_fn=<MseLossBackward>)
output :  tensor([[168934.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(25660714., grad_fn=<MseLossBackward>)
output :  tensor([[84275.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(524809.6875, grad_fn=<MseLossBackward>)
output :  tensor([[289769.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(53130.2500, grad_fn=<MseLossBackward>)
output :  tensor([[167118.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4489499., grad_fn=<MseLossBackward>)
output :  tensor([[191383.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0103e+10, grad_fn=<MseLossBackward>)
output :  tensor([[240451.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3319e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152541.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2375692.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124140.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(19832.5605, grad_fn=<MseLossBackward>)
output :  tensor([[114282.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(31554464., grad_fn=<MseLossBackward>)
output :  tensor([[144378.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6310e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172870.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1274746.8750, grad_fn=<MseLossBackward>)
output :  tensor([[112921.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2544e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207125.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2293e+10, grad_fn=<MseLossBackward>)
output :  tensor([[237388.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(16906746., grad_fn=<MseLossBackward>)
output :  tensor([[249088.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1346e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222763.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6361e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194889.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4547e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191205.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(13730962., grad_fn=<MseLossBackward>)
output :  tensor([[205992.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7907e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186091.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2473e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174161.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(20966812., grad_fn=<MseLossBackward>)
output :  tensor([[153613.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2602222.7500, grad_fn=<MseLossBackward>)
output :  tensor([[335451.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2397658.7500, grad_fn=<MseLossBackward>)
output :  tensor([[207821.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(17458556., grad_fn=<MseLossBackward>)
output :  tensor([[161121.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1257587., grad_fn=<MseLossBackward>)
output :  tensor([[185813.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1010e+09, grad_fn=<MseLossBackward>)
output :  tensor([[104725.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(75320.2266, grad_fn=<MseLossBackward>)
output :  tensor([[271799.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0203e+10, grad_fn=<MseLossBackward>)
output :  tensor([[172424.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2178253.2500, grad_fn=<MseLossBackward>)
output :  tensor([[213132.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(134769.2969, grad_fn=<MseLossBackward>)
output :  tensor([[207136.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9219e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176882.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5370444., grad_fn=<MseLossBackward>)
output :  tensor([[207971.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(38087604., grad_fn=<MseLossBackward>)
output :  tensor([[155562.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(316933.8125, grad_fn=<MseLossBackward>)
output :  tensor([[152245.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7296e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120083.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(2508635.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138124.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3518496.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147167.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3358514.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202114.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5847e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159232.]], grad_fn=<AddmmBackward>)
loss:  tensor(71824., grad_fn=<MseLossBackward>)
output :  tensor([[101230.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(2993575.7500, grad_fn=<MseLossBackward>)
output :  tensor([[223270.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7987e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188136.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1239e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177809.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1755004., grad_fn=<MseLossBackward>)
output :  tensor([[80188.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3282608., grad_fn=<MseLossBackward>)
output :  tensor([[130964.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6072374., grad_fn=<MseLossBackward>)
output :  tensor([[216702.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7303928.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143436.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(317761.2188, grad_fn=<MseLossBackward>)
output :  tensor([[135677.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(32238264., grad_fn=<MseLossBackward>)
output :  tensor([[141461.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1295435.2500, grad_fn=<MseLossBackward>)
output :  tensor([[180428.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8428e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143967.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1063.3713, grad_fn=<MseLossBackward>)
output :  tensor([[160436.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(190736.9219, grad_fn=<MseLossBackward>)
output :  tensor([[211951.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(9294686., grad_fn=<MseLossBackward>)
output :  tensor([[139190.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1690e+09, grad_fn=<MseLossBackward>)
output :  tensor([[254165.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(695582.0625, grad_fn=<MseLossBackward>)
output :  tensor([[158657.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(710280.2500, grad_fn=<MseLossBackward>)
output :  tensor([[127477.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(1045266.6250, grad_fn=<MseLossBackward>)
output :  tensor([[94976.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(544.5660, grad_fn=<MseLossBackward>)
output :  tensor([[154525.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9035e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181316.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2006472.2500, grad_fn=<MseLossBackward>)
output :  tensor([[122500.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(4003782.2500, grad_fn=<MseLossBackward>)
output :  tensor([[186083.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8376e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147474.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6205e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150489.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(347307.6250, grad_fn=<MseLossBackward>)
output :  tensor([[188618.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(754455.1250, grad_fn=<MseLossBackward>)
output :  tensor([[251825.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7017e+09, grad_fn=<MseLossBackward>)
output :  tensor([[91043.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(207993., grad_fn=<MseLossBackward>)
output :  tensor([[244548.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(20687716., grad_fn=<MseLossBackward>)
output :  tensor([[125646.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(8144112., grad_fn=<MseLossBackward>)
output :  tensor([[168069.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5709e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115857.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5145e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179342.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(11171053., grad_fn=<MseLossBackward>)
output :  tensor([[166168.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1653e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158643.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9204e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238152.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(718812.5000, grad_fn=<MseLossBackward>)
output :  tensor([[228946.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4411e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125354.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(2706153.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133041.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(49577440., grad_fn=<MseLossBackward>)
output :  tensor([[222906.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(16754440., grad_fn=<MseLossBackward>)
output :  tensor([[230105.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(15167982., grad_fn=<MseLossBackward>)
output :  tensor([[231052.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(18942624., grad_fn=<MseLossBackward>)
output :  tensor([[147623.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(141917.0156, grad_fn=<MseLossBackward>)
output :  tensor([[214287.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(18382254., grad_fn=<MseLossBackward>)
output :  tensor([[132883.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6598e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134582.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4335244.5000, grad_fn=<MseLossBackward>)
output :  tensor([[308927.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(36869944., grad_fn=<MseLossBackward>)
output :  tensor([[138964.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4144405.2500, grad_fn=<MseLossBackward>)
output :  tensor([[118638.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6665e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109931.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(186590.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155029.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0522e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180841.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8142e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176363.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(11313763., grad_fn=<MseLossBackward>)
output :  tensor([[190668.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0674e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96861.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(9851212., grad_fn=<MseLossBackward>)
output :  tensor([[176162.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8051761., grad_fn=<MseLossBackward>)
output :  tensor([[170850.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8704528., grad_fn=<MseLossBackward>)
output :  tensor([[139634.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(402967.0625, grad_fn=<MseLossBackward>)
output :  tensor([[256364.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0555e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143191.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3863e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171083.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3671415.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140381.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(145661.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198551.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3797443.7500, grad_fn=<MseLossBackward>)
output :  tensor([[168274.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2977997.2500, grad_fn=<MseLossBackward>)
output :  tensor([[242497.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2256567.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134401.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9788.6289, grad_fn=<MseLossBackward>)
output :  tensor([[151466.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4479307.5000, grad_fn=<MseLossBackward>)
output :  tensor([[215333.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(111295.2188, grad_fn=<MseLossBackward>)
output :  tensor([[160159.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(23433012., grad_fn=<MseLossBackward>)
output :  tensor([[190452.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2110936.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137168.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7660e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129180.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(32608.4590, grad_fn=<MseLossBackward>)
output :  tensor([[137860.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4578262.5000, grad_fn=<MseLossBackward>)
output :  tensor([[197932.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1218e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165484.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5487e+09, grad_fn=<MseLossBackward>)
output :  tensor([[78912.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5768e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93836.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(87174464., grad_fn=<MseLossBackward>)
output :  tensor([[257954.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(21725066., grad_fn=<MseLossBackward>)
output :  tensor([[203256.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1289e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115236.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(56113.4688, grad_fn=<MseLossBackward>)
output :  tensor([[159181.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0194e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207484.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5663e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177788.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5029e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157151.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4627742., grad_fn=<MseLossBackward>)
output :  tensor([[171198.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1435391.2500, grad_fn=<MseLossBackward>)
output :  tensor([[114014.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(971225.6250, grad_fn=<MseLossBackward>)
output :  tensor([[163524.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(72667104., grad_fn=<MseLossBackward>)
output :  tensor([[192666.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0259e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219272.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(51841.5977, grad_fn=<MseLossBackward>)
output :  tensor([[244566.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5043e+11, grad_fn=<MseLossBackward>)
output :  tensor([[148954.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3820253.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110416.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(3749941.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170668.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2616e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152148.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2718428., grad_fn=<MseLossBackward>)
output :  tensor([[233777.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(10383499., grad_fn=<MseLossBackward>)
output :  tensor([[116839.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3384795., grad_fn=<MseLossBackward>)
output :  tensor([[183194.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(86509.5156, grad_fn=<MseLossBackward>)
output :  tensor([[185344.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1838397., grad_fn=<MseLossBackward>)
output :  tensor([[165136.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3983e+10, grad_fn=<MseLossBackward>)
output :  tensor([[95888.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2167e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238460.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(290689.4688, grad_fn=<MseLossBackward>)
output :  tensor([[177806.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3263442.2500, grad_fn=<MseLossBackward>)
output :  tensor([[141814.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3292013.2500, grad_fn=<MseLossBackward>)
output :  tensor([[232691.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5328378.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162591.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(167204.3281, grad_fn=<MseLossBackward>)
output :  tensor([[200439.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5515e+10, grad_fn=<MseLossBackward>)
output :  tensor([[138489.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(12177810., grad_fn=<MseLossBackward>)
output :  tensor([[185422.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4861e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137112.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1237273.8750, grad_fn=<MseLossBackward>)
output :  tensor([[228065.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(62962984., grad_fn=<MseLossBackward>)
output :  tensor([[222055.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8089e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93084.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(9514237., grad_fn=<MseLossBackward>)
output :  tensor([[160933.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2248922., grad_fn=<MseLossBackward>)
output :  tensor([[243467.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6233e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146237.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1531483.6250, grad_fn=<MseLossBackward>)
output :  tensor([[109335.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7923e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164457.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1815.5588, grad_fn=<MseLossBackward>)
output :  tensor([[142373.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2646874.7500, grad_fn=<MseLossBackward>)
output :  tensor([[129769.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(2462226.7500, grad_fn=<MseLossBackward>)
output :  tensor([[189171.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8760e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123173.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(454107.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150369.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2658275.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167067.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(21929026., grad_fn=<MseLossBackward>)
output :  tensor([[152132.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1282414.7500, grad_fn=<MseLossBackward>)
output :  tensor([[160929.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3881885., grad_fn=<MseLossBackward>)
output :  tensor([[135208.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8690e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133019.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1039284.6875, grad_fn=<MseLossBackward>)
output :  tensor([[157198.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3117e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144052.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(9853.6641, grad_fn=<MseLossBackward>)
output :  tensor([[163117.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1869073.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141919.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0253e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149381.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(337633.6250, grad_fn=<MseLossBackward>)
output :  tensor([[185733.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5135393.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169556.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(309866.1875, grad_fn=<MseLossBackward>)
output :  tensor([[179248.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(564447., grad_fn=<MseLossBackward>)
output :  tensor([[223215.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(10337933., grad_fn=<MseLossBackward>)
output :  tensor([[110184.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(5218369., grad_fn=<MseLossBackward>)
output :  tensor([[136887.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4370e+08, grad_fn=<MseLossBackward>)
output :  tensor([[284972.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1055242.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120106.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(16859750., grad_fn=<MseLossBackward>)
output :  tensor([[179604.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6318e+09, grad_fn=<MseLossBackward>)
output :  tensor([[188292.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(10841276., grad_fn=<MseLossBackward>)
output :  tensor([[185786.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(82342.0938, grad_fn=<MseLossBackward>)
output :  tensor([[248204.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1802e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221746.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(64468.3828, grad_fn=<MseLossBackward>)
output :  tensor([[131664.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6381e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176460.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5037e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122850.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1320272.8750, grad_fn=<MseLossBackward>)
output :  tensor([[180918.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6492e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151452.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2393934.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156271.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(95474272., grad_fn=<MseLossBackward>)
output :  tensor([[205211.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1185036.3750, grad_fn=<MseLossBackward>)
output :  tensor([[145387.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6609e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175144.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(731532.7500, grad_fn=<MseLossBackward>)
output :  tensor([[248989.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3091e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148637.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(406864.5938, grad_fn=<MseLossBackward>)
output :  tensor([[202442.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(49694.1641, grad_fn=<MseLossBackward>)
output :  tensor([[165049.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(26006972., grad_fn=<MseLossBackward>)
output :  tensor([[125878.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4348e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133418.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5435528., grad_fn=<MseLossBackward>)
output :  tensor([[180658.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(11163952., grad_fn=<MseLossBackward>)
output :  tensor([[194619.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(21342668., grad_fn=<MseLossBackward>)
output :  tensor([[220739.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6595e+09, grad_fn=<MseLossBackward>)
output :  tensor([[252370.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(21427930., grad_fn=<MseLossBackward>)
output :  tensor([[183437.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8377e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142747.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6263e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148580.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(16654433., grad_fn=<MseLossBackward>)
output :  tensor([[72930.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0844e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128251.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(45548156., grad_fn=<MseLossBackward>)
output :  tensor([[126848.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4210447.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157098.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(9601186., grad_fn=<MseLossBackward>)
output :  tensor([[127848.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(719594.3125, grad_fn=<MseLossBackward>)
output :  tensor([[76472.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(747.6807, grad_fn=<MseLossBackward>)
output :  tensor([[82988.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(976622.6250, grad_fn=<MseLossBackward>)
output :  tensor([[226377.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(31617778., grad_fn=<MseLossBackward>)
output :  tensor([[141052.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1526e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135772.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(27798762., grad_fn=<MseLossBackward>)
output :  tensor([[169864.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8207867., grad_fn=<MseLossBackward>)
output :  tensor([[236273.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1622638.1250, grad_fn=<MseLossBackward>)
output :  tensor([[190436.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2902285., grad_fn=<MseLossBackward>)
output :  tensor([[159617.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(13086419., grad_fn=<MseLossBackward>)
output :  tensor([[196524.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1890839.8750, grad_fn=<MseLossBackward>)
output :  tensor([[198251.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5015e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137696.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(485482.3438, grad_fn=<MseLossBackward>)
output :  tensor([[154500.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(249734.4531, grad_fn=<MseLossBackward>)
output :  tensor([[136580.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(337270.5625, grad_fn=<MseLossBackward>)
output :  tensor([[197664.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0456e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154490.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(240375.7031, grad_fn=<MseLossBackward>)
output :  tensor([[136711.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8672e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144185.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(510398.6250, grad_fn=<MseLossBackward>)
output :  tensor([[205617.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(40741092., grad_fn=<MseLossBackward>)
output :  tensor([[105437.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4932e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166166.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1779431., grad_fn=<MseLossBackward>)
output :  tensor([[130356.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(5553939., grad_fn=<MseLossBackward>)
output :  tensor([[147546.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(299174.8125, grad_fn=<MseLossBackward>)
output :  tensor([[105440.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8539e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141182.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(13562763., grad_fn=<MseLossBackward>)
output :  tensor([[235909.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(8278.1562, grad_fn=<MseLossBackward>)
output :  tensor([[145270.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(73373.2656, grad_fn=<MseLossBackward>)
output :  tensor([[139794.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5263439.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167119.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5304e+09, grad_fn=<MseLossBackward>)
output :  tensor([[260694.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9947e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176870.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3497250.7500, grad_fn=<MseLossBackward>)
output :  tensor([[103089.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(98203.8906, grad_fn=<MseLossBackward>)
output :  tensor([[198903.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1775e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160627.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2647993.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162068.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6379e+10, grad_fn=<MseLossBackward>)
output :  tensor([[96702.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2550608.7500, grad_fn=<MseLossBackward>)
output :  tensor([[121855.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(3044670.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158372.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5629646., grad_fn=<MseLossBackward>)
output :  tensor([[141623.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2635295.7500, grad_fn=<MseLossBackward>)
output :  tensor([[200265.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(70697.8281, grad_fn=<MseLossBackward>)
output :  tensor([[142795.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(633267.8125, grad_fn=<MseLossBackward>)
output :  tensor([[263122.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(709964.2500, grad_fn=<MseLossBackward>)
output :  tensor([[130772.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4268e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163161.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5467851.5000, grad_fn=<MseLossBackward>)
output :  tensor([[189010.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(260530.4844, grad_fn=<MseLossBackward>)
output :  tensor([[122730.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6207e+08, grad_fn=<MseLossBackward>)
output :  tensor([[255132.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(26343358., grad_fn=<MseLossBackward>)
output :  tensor([[157673.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6003e+08, grad_fn=<MseLossBackward>)
output :  tensor([[241307.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(16345217., grad_fn=<MseLossBackward>)
output :  tensor([[144671.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(451248.0625, grad_fn=<MseLossBackward>)
output :  tensor([[206224.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(14251333., grad_fn=<MseLossBackward>)
output :  tensor([[172752.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(124289.2969, grad_fn=<MseLossBackward>)
output :  tensor([[155753.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3076461.2500, grad_fn=<MseLossBackward>)
output :  tensor([[117227.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(596418.3125, grad_fn=<MseLossBackward>)
output :  tensor([[234275.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7893e+09, grad_fn=<MseLossBackward>)
output :  tensor([[234198.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(33654864., grad_fn=<MseLossBackward>)
output :  tensor([[150200.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(9837632., grad_fn=<MseLossBackward>)
output :  tensor([[253428.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2165450.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123712.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(84793592., grad_fn=<MseLossBackward>)
output :  tensor([[175869.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(16973.2031, grad_fn=<MseLossBackward>)
output :  tensor([[158969.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1061865.8750, grad_fn=<MseLossBackward>)
output :  tensor([[134651.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(13335620., grad_fn=<MseLossBackward>)
output :  tensor([[197281.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5943e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163173.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(683076.4375, grad_fn=<MseLossBackward>)
output :  tensor([[161637.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1856917.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158274.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(75127.3828, grad_fn=<MseLossBackward>)
output :  tensor([[155651.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(33075260., grad_fn=<MseLossBackward>)
output :  tensor([[174548.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2313e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161944.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3782782., grad_fn=<MseLossBackward>)
output :  tensor([[373882.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0177e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131312.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(18595230., grad_fn=<MseLossBackward>)
output :  tensor([[131121.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0813e+09, grad_fn=<MseLossBackward>)
output :  tensor([[279669.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2381813.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160484.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2297877., grad_fn=<MseLossBackward>)
output :  tensor([[131411.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1907e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238850.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(46922928., grad_fn=<MseLossBackward>)
output :  tensor([[181617.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1249504.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153519.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2309545., grad_fn=<MseLossBackward>)
output :  tensor([[145411.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(169563.7969, grad_fn=<MseLossBackward>)
output :  tensor([[155058.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2975e+08, grad_fn=<MseLossBackward>)
output :  tensor([[102406.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(5789324.5000, grad_fn=<MseLossBackward>)
output :  tensor([[82133.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8987e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164718.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(79215.8594, grad_fn=<MseLossBackward>)
output :  tensor([[187538.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6372e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159529.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2338749., grad_fn=<MseLossBackward>)
output :  tensor([[154211.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(10816493., grad_fn=<MseLossBackward>)
output :  tensor([[139358.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3642074., grad_fn=<MseLossBackward>)
output :  tensor([[203135.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7922553.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137838.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(26168.1172, grad_fn=<MseLossBackward>)
output :  tensor([[181670.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6468e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141954.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(16368978., grad_fn=<MseLossBackward>)
output :  tensor([[109465.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0042e+08, grad_fn=<MseLossBackward>)
output :  tensor([[97491.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(12190736., grad_fn=<MseLossBackward>)
output :  tensor([[173269.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2995549.7500, grad_fn=<MseLossBackward>)
output :  tensor([[270339.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(98784344., grad_fn=<MseLossBackward>)
output :  tensor([[141264.]], grad_fn=<AddmmBackward>)
loss:  tensor(55696., grad_fn=<MseLossBackward>)
output :  tensor([[157965.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3723090.7500, grad_fn=<MseLossBackward>)
output :  tensor([[129981.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(6343747.5000, grad_fn=<MseLossBackward>)
output :  tensor([[149694.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(37787.7148, grad_fn=<MseLossBackward>)
output :  tensor([[165828.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4291112., grad_fn=<MseLossBackward>)
output :  tensor([[130231.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(10439765., grad_fn=<MseLossBackward>)
output :  tensor([[174617.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7721e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156860.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(19591.2500, grad_fn=<MseLossBackward>)
output :  tensor([[120423.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(15394097., grad_fn=<MseLossBackward>)
output :  tensor([[162558.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9621e+09, grad_fn=<MseLossBackward>)
output :  tensor([[49504.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6225726.5000, grad_fn=<MseLossBackward>)
output :  tensor([[232724.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3641e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201387.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(150398.5312, grad_fn=<MseLossBackward>)
output :  tensor([[182878.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4499768., grad_fn=<MseLossBackward>)
output :  tensor([[107573.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(2475238.5000, grad_fn=<MseLossBackward>)
output :  tensor([[91351.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(18932832., grad_fn=<MseLossBackward>)
output :  tensor([[153246.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7548e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219417.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5625e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201465.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(36413116., grad_fn=<MseLossBackward>)
output :  tensor([[163696.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1699071.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170775.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8782e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190066.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4445.1387, grad_fn=<MseLossBackward>)
output :  tensor([[89070.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(4286485., grad_fn=<MseLossBackward>)
output :  tensor([[142759.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7615530., grad_fn=<MseLossBackward>)
output :  tensor([[108327.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4721386., grad_fn=<MseLossBackward>)
output :  tensor([[147601.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3551e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173358.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7942e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192483.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5666e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179435.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(318201.7500, grad_fn=<MseLossBackward>)
output :  tensor([[97077.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(333533.3125, grad_fn=<MseLossBackward>)
output :  tensor([[116399.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1211375.3750, grad_fn=<MseLossBackward>)
output :  tensor([[160400.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5695e+08, grad_fn=<MseLossBackward>)
output :  tensor([[200145.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(21083.9473, grad_fn=<MseLossBackward>)
output :  tensor([[142437.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2441943.5000, grad_fn=<MseLossBackward>)
train_loss: [2.661646e+09]
epoch_result tensor([0.])
output :  tensor([[157670.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(687474.1875, grad_fn=<MseLossBackward>)
output :  tensor([[121635.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(133128.0625, grad_fn=<MseLossBackward>)
output :  tensor([[192939.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1591815.8750, grad_fn=<MseLossBackward>)
output :  tensor([[178414.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1999882.1250, grad_fn=<MseLossBackward>)
output :  tensor([[154784.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3897e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129194.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1426681., grad_fn=<MseLossBackward>)
output :  tensor([[139469.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2343865.2500, grad_fn=<MseLossBackward>)
output :  tensor([[118504.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(245427.3594, grad_fn=<MseLossBackward>)
output :  tensor([[68289.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(95841656., grad_fn=<MseLossBackward>)
output :  tensor([[167894.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3590492., grad_fn=<MseLossBackward>)
output :  tensor([[144172.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(17408322., grad_fn=<MseLossBackward>)
output :  tensor([[225455.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(207551.4219, grad_fn=<MseLossBackward>)
output :  tensor([[170147.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1316612.8750, grad_fn=<MseLossBackward>)
output :  tensor([[249778.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6113.2852, grad_fn=<MseLossBackward>)
output :  tensor([[57153.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(4636250., grad_fn=<MseLossBackward>)
output :  tensor([[165261.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3103e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180681.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(32282106., grad_fn=<MseLossBackward>)
output :  tensor([[173671.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9486e+08, grad_fn=<MseLossBackward>)
output :  tensor([[275701.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(491620.0938, grad_fn=<MseLossBackward>)
output :  tensor([[197493.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(243696.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138179.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5252e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193688.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(36302.1562, grad_fn=<MseLossBackward>)
output :  tensor([[180528.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9689e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152788.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3198900., grad_fn=<MseLossBackward>)
output :  tensor([[169568.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(185963.0938, grad_fn=<MseLossBackward>)
output :  tensor([[83368.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(4128039.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169535.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1963e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186956.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3829543.2500, grad_fn=<MseLossBackward>)
output :  tensor([[203103.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7454e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109588.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(169390.1250, grad_fn=<MseLossBackward>)
output :  tensor([[169856.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1307949.6250, grad_fn=<MseLossBackward>)
output :  tensor([[137282.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(611597.3125, grad_fn=<MseLossBackward>)
output :  tensor([[126995.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(4018552.7500, grad_fn=<MseLossBackward>)
output :  tensor([[120100.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(360262.5625, grad_fn=<MseLossBackward>)
output :  tensor([[147814.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4956e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171100.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0707e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151746.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4187778.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180522.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(272794.0312, grad_fn=<MseLossBackward>)
output :  tensor([[141951.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(905500.9375, grad_fn=<MseLossBackward>)
output :  tensor([[104609.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1345e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136496.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1629e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137430.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5906798.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138979.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4351e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223691.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1713440.1250, grad_fn=<MseLossBackward>)
output :  tensor([[132858.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(370291.2812, grad_fn=<MseLossBackward>)
output :  tensor([[148667.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(110577.0312, grad_fn=<MseLossBackward>)
output :  tensor([[113914.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(3664143.7500, grad_fn=<MseLossBackward>)
output :  tensor([[163290.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(10826876., grad_fn=<MseLossBackward>)
output :  tensor([[145007.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4993e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194375.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5641367., grad_fn=<MseLossBackward>)
output :  tensor([[137904.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(11934110., grad_fn=<MseLossBackward>)
output :  tensor([[112969.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(8815750., grad_fn=<MseLossBackward>)
output :  tensor([[231084.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(8500049., grad_fn=<MseLossBackward>)
output :  tensor([[163615.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4874e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157280.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2958077.5000, grad_fn=<MseLossBackward>)
output :  tensor([[206488.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7560e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243382.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2236e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142175.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1753513.8750, grad_fn=<MseLossBackward>)
output :  tensor([[141261.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(52728700., grad_fn=<MseLossBackward>)
output :  tensor([[157094.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4387388.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135244.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(27508222., grad_fn=<MseLossBackward>)
output :  tensor([[182165.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0581e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183080.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1039220.9375, grad_fn=<MseLossBackward>)
output :  tensor([[159663.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3373880.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153075.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0151e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141486.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1026485.5625, grad_fn=<MseLossBackward>)
output :  tensor([[137290.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(59443136., grad_fn=<MseLossBackward>)
output :  tensor([[172952.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4534e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194400.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1073e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140235.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(13951275., grad_fn=<MseLossBackward>)
output :  tensor([[169902.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3991567., grad_fn=<MseLossBackward>)
output :  tensor([[178061.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(8633221., grad_fn=<MseLossBackward>)
output :  tensor([[114465.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(285456.4688, grad_fn=<MseLossBackward>)
output :  tensor([[222156.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1337709.1250, grad_fn=<MseLossBackward>)
output :  tensor([[180334.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(10020687., grad_fn=<MseLossBackward>)
output :  tensor([[127806.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(5320447., grad_fn=<MseLossBackward>)
output :  tensor([[196699.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(39663.2109, grad_fn=<MseLossBackward>)
output :  tensor([[172960.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3763418.2500, grad_fn=<MseLossBackward>)
output :  tensor([[207980.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1780e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209615.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1916753.7500, grad_fn=<MseLossBackward>)
output :  tensor([[168938.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4393e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193461.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1078871.7500, grad_fn=<MseLossBackward>)
output :  tensor([[114297.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1683100.7500, grad_fn=<MseLossBackward>)
output :  tensor([[114571.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(4290885.5000, grad_fn=<MseLossBackward>)
output :  tensor([[114348.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5516700., grad_fn=<MseLossBackward>)
output :  tensor([[144054.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7539314.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159174.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3661e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180419.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(175849.1875, grad_fn=<MseLossBackward>)
output :  tensor([[126624.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(767334.9375, grad_fn=<MseLossBackward>)
output :  tensor([[144081.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(843843.1875, grad_fn=<MseLossBackward>)
output :  tensor([[183393.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3516e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119912.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(9073321., grad_fn=<MseLossBackward>)
output :  tensor([[198078.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1162387.2500, grad_fn=<MseLossBackward>)
output :  tensor([[147811.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7903917., grad_fn=<MseLossBackward>)
output :  tensor([[213988.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1185512.6250, grad_fn=<MseLossBackward>)
output :  tensor([[128829.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(8003904., grad_fn=<MseLossBackward>)
output :  tensor([[248379.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2652.2500, grad_fn=<MseLossBackward>)
output :  tensor([[233842.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6171e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151669.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1085e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85784.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1430e+08, grad_fn=<MseLossBackward>)
output :  tensor([[189204.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3437e+09, grad_fn=<MseLossBackward>)
output :  tensor([[81508.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(258667.6094, grad_fn=<MseLossBackward>)
output :  tensor([[140173.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(453602.2500, grad_fn=<MseLossBackward>)
output :  tensor([[77365.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(3480177.7500, grad_fn=<MseLossBackward>)
output :  tensor([[145742.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7782618., grad_fn=<MseLossBackward>)
output :  tensor([[173982.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4070054., grad_fn=<MseLossBackward>)
output :  tensor([[153916.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(173563.3750, grad_fn=<MseLossBackward>)
output :  tensor([[109076.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(2809421.2500, grad_fn=<MseLossBackward>)
output :  tensor([[203546.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2590e+10, grad_fn=<MseLossBackward>)
output :  tensor([[125936.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(6570290.5000, grad_fn=<MseLossBackward>)
output :  tensor([[270944.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(81997552., grad_fn=<MseLossBackward>)
output :  tensor([[302378.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(58086308., grad_fn=<MseLossBackward>)
output :  tensor([[106453.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(1096127.2500, grad_fn=<MseLossBackward>)
output :  tensor([[168585.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(15323310., grad_fn=<MseLossBackward>)
output :  tensor([[133398.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4507e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137474.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2327674.7500, grad_fn=<MseLossBackward>)
output :  tensor([[130246.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(15.5655, grad_fn=<MseLossBackward>)
output :  tensor([[127231.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4979592., grad_fn=<MseLossBackward>)
output :  tensor([[134897.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4503e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227105.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8375e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188930.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3125e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145488.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2524772., grad_fn=<MseLossBackward>)
output :  tensor([[125730.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(3130549.7500, grad_fn=<MseLossBackward>)
output :  tensor([[115702.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(19824618., grad_fn=<MseLossBackward>)
output :  tensor([[254181.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0806e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135142.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(20328.5215, grad_fn=<MseLossBackward>)
output :  tensor([[203995.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(991953.7500, grad_fn=<MseLossBackward>)
output :  tensor([[106673.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3146355.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142432.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6161798., grad_fn=<MseLossBackward>)
output :  tensor([[202622.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7862e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180217.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(100687.2188, grad_fn=<MseLossBackward>)
output :  tensor([[185438.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(192035.6719, grad_fn=<MseLossBackward>)
output :  tensor([[162717.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1399e+10, grad_fn=<MseLossBackward>)
output :  tensor([[294864.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6108e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197619.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(78750.3906, grad_fn=<MseLossBackward>)
output :  tensor([[259307.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0608e+10, grad_fn=<MseLossBackward>)
output :  tensor([[216175.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4825e+09, grad_fn=<MseLossBackward>)
output :  tensor([[279172.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4309e+09, grad_fn=<MseLossBackward>)
output :  tensor([[223793.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(42622.8945, grad_fn=<MseLossBackward>)
output :  tensor([[224174.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8165e+10, grad_fn=<MseLossBackward>)
output :  tensor([[197244.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(59948.4609, grad_fn=<MseLossBackward>)
output :  tensor([[159760.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4622e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130291.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4879543., grad_fn=<MseLossBackward>)
output :  tensor([[135049.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(202598.4531, grad_fn=<MseLossBackward>)
output :  tensor([[93242.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5029857.5000, grad_fn=<MseLossBackward>)
output :  tensor([[108738.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(546074.8125, grad_fn=<MseLossBackward>)
output :  tensor([[270255.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4392e+09, grad_fn=<MseLossBackward>)
output :  tensor([[232111.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(8341717.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145469.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(220474.2656, grad_fn=<MseLossBackward>)
output :  tensor([[135819.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2824500.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172721.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1023037.4375, grad_fn=<MseLossBackward>)
output :  tensor([[147713.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6071219., grad_fn=<MseLossBackward>)
output :  tensor([[163244.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7688e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166213.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1473113.2500, grad_fn=<MseLossBackward>)
output :  tensor([[137637.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(406007.9062, grad_fn=<MseLossBackward>)
output :  tensor([[189331.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4665e+09, grad_fn=<MseLossBackward>)
output :  tensor([[112017.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(322.8760, grad_fn=<MseLossBackward>)
output :  tensor([[168615.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(11456956., grad_fn=<MseLossBackward>)
output :  tensor([[116607.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(11506777., grad_fn=<MseLossBackward>)
output :  tensor([[86664.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(112638.8984, grad_fn=<MseLossBackward>)
output :  tensor([[179431.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(322801.5312, grad_fn=<MseLossBackward>)
output :  tensor([[110007.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(11502.5625, grad_fn=<MseLossBackward>)
output :  tensor([[237703.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1680831.2500, grad_fn=<MseLossBackward>)
output :  tensor([[245838.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(703527.7500, grad_fn=<MseLossBackward>)
output :  tensor([[132821.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(11032570., grad_fn=<MseLossBackward>)
output :  tensor([[112535.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(12793252., grad_fn=<MseLossBackward>)
output :  tensor([[285502.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2998e+10, grad_fn=<MseLossBackward>)
output :  tensor([[168350.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(9918858., grad_fn=<MseLossBackward>)
output :  tensor([[124374.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(390918.0312, grad_fn=<MseLossBackward>)
output :  tensor([[143635.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5719e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203179.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1709e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140712.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(82719.1562, grad_fn=<MseLossBackward>)
output :  tensor([[155234.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5567e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150245.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(13354114., grad_fn=<MseLossBackward>)
output :  tensor([[130274.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(599741.3125, grad_fn=<MseLossBackward>)
output :  tensor([[243184.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8310e+10, grad_fn=<MseLossBackward>)
output :  tensor([[399841.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4658178., grad_fn=<MseLossBackward>)
output :  tensor([[112869.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(14971579., grad_fn=<MseLossBackward>)
output :  tensor([[109731.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(76887144., grad_fn=<MseLossBackward>)
output :  tensor([[157782.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2948411., grad_fn=<MseLossBackward>)
output :  tensor([[131663.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9891e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162263.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5684e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175322.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2670e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105947.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(5512774., grad_fn=<MseLossBackward>)
output :  tensor([[141178.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(31828.7891, grad_fn=<MseLossBackward>)
output :  tensor([[366990.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(92055.3516, grad_fn=<MseLossBackward>)
output :  tensor([[200629.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8484e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175784.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(80975.8125, grad_fn=<MseLossBackward>)
output :  tensor([[202014.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(784303.9375, grad_fn=<MseLossBackward>)
output :  tensor([[140372.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1882469.7500, grad_fn=<MseLossBackward>)
output :  tensor([[195312.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(660918.1875, grad_fn=<MseLossBackward>)
output :  tensor([[136008.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1273e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180251.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(560930.8125, grad_fn=<MseLossBackward>)
output :  tensor([[237410.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(21063798., grad_fn=<MseLossBackward>)
output :  tensor([[176786.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7762405.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109148.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1318585.7500, grad_fn=<MseLossBackward>)
output :  tensor([[265101.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(292038.9062, grad_fn=<MseLossBackward>)
output :  tensor([[251305.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1704942.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123384.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(147966.4375, grad_fn=<MseLossBackward>)
output :  tensor([[213073.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8348e+09, grad_fn=<MseLossBackward>)
output :  tensor([[303117.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9206e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207373.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(139373.8906, grad_fn=<MseLossBackward>)
output :  tensor([[211801.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6435e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159081.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1395536.1250, grad_fn=<MseLossBackward>)
output :  tensor([[170052.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3869.2288, grad_fn=<MseLossBackward>)
output :  tensor([[159477.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6478059., grad_fn=<MseLossBackward>)
output :  tensor([[168515.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2204668.2500, grad_fn=<MseLossBackward>)
output :  tensor([[234979.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0904e+09, grad_fn=<MseLossBackward>)
output :  tensor([[216790.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6041e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161660.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1494e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123134.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(17976.9434, grad_fn=<MseLossBackward>)
output :  tensor([[176147.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(727449.0625, grad_fn=<MseLossBackward>)
output :  tensor([[178806.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5923e+09, grad_fn=<MseLossBackward>)
output :  tensor([[203087.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6684e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132619.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3283457.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153291.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0043e+09, grad_fn=<MseLossBackward>)
output :  tensor([[278138.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1297249.8750, grad_fn=<MseLossBackward>)
output :  tensor([[86839.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3385542.5000, grad_fn=<MseLossBackward>)
output :  tensor([[237775.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1626063.2500, grad_fn=<MseLossBackward>)
output :  tensor([[257487.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0591e+11, grad_fn=<MseLossBackward>)
output :  tensor([[167569.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5905128., grad_fn=<MseLossBackward>)
output :  tensor([[192457.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8099e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154014.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(971826.3125, grad_fn=<MseLossBackward>)
output :  tensor([[204873.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2414e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127521.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2185084.5000, grad_fn=<MseLossBackward>)
output :  tensor([[149602.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(21182000., grad_fn=<MseLossBackward>)
output :  tensor([[171710.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5323e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184541.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1710986.6250, grad_fn=<MseLossBackward>)
output :  tensor([[127413.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1999175.1250, grad_fn=<MseLossBackward>)
output :  tensor([[138732.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4985312., grad_fn=<MseLossBackward>)
output :  tensor([[168974.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(16207418., grad_fn=<MseLossBackward>)
output :  tensor([[199595.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5406e+09, grad_fn=<MseLossBackward>)
output :  tensor([[240320.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(7181144., grad_fn=<MseLossBackward>)
output :  tensor([[154024.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(952179.5625, grad_fn=<MseLossBackward>)
output :  tensor([[199940.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(15524585., grad_fn=<MseLossBackward>)
output :  tensor([[163504.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8043e+08, grad_fn=<MseLossBackward>)
output :  tensor([[192287.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6352e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177438.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6060213., grad_fn=<MseLossBackward>)
output :  tensor([[97600.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(360281.3125, grad_fn=<MseLossBackward>)
output :  tensor([[171877.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1690e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135483.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(233832.6875, grad_fn=<MseLossBackward>)
output :  tensor([[125783.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1629e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171828.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4716566., grad_fn=<MseLossBackward>)
output :  tensor([[90699.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(32487506., grad_fn=<MseLossBackward>)
output :  tensor([[292078.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4321591.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166717.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2951202., grad_fn=<MseLossBackward>)
output :  tensor([[191135.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0173e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243233.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7097e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147168.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(14682428., grad_fn=<MseLossBackward>)
output :  tensor([[122128.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(3502190.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121630.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2995441.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147359.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0471e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175712.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2931800., grad_fn=<MseLossBackward>)
output :  tensor([[116021.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1237e+09, grad_fn=<MseLossBackward>)
output :  tensor([[204958.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2778e+10, grad_fn=<MseLossBackward>)
output :  tensor([[242513.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1026802.2500, grad_fn=<MseLossBackward>)
output :  tensor([[247725.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1746e+10, grad_fn=<MseLossBackward>)
output :  tensor([[220051.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5906e+08, grad_fn=<MseLossBackward>)
output :  tensor([[193179.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4962e+10, grad_fn=<MseLossBackward>)
output :  tensor([[185691.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3272368., grad_fn=<MseLossBackward>)
output :  tensor([[208520.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6807e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189700.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1404e+10, grad_fn=<MseLossBackward>)
output :  tensor([[176199.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6452949.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151386.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(376746.5938, grad_fn=<MseLossBackward>)
output :  tensor([[331801.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(27022452., grad_fn=<MseLossBackward>)
output :  tensor([[207717.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(18342750., grad_fn=<MseLossBackward>)
output :  tensor([[157958.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4167148., grad_fn=<MseLossBackward>)
output :  tensor([[184928.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2004e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108734.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(13946374., grad_fn=<MseLossBackward>)
output :  tensor([[270112.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1161e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170270.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(13175539., grad_fn=<MseLossBackward>)
output :  tensor([[215421.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3691621.7500, grad_fn=<MseLossBackward>)
output :  tensor([[204789.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6279e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178481.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(516826.1875, grad_fn=<MseLossBackward>)
output :  tensor([[201335.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(215978.0469, grad_fn=<MseLossBackward>)
output :  tensor([[153247.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3070270.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150290.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5292e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118182.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(101104.1250, grad_fn=<MseLossBackward>)
output :  tensor([[141305.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1705554.3750, grad_fn=<MseLossBackward>)
output :  tensor([[146045.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8730086., grad_fn=<MseLossBackward>)
output :  tensor([[200423.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6276e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161782.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5211661., grad_fn=<MseLossBackward>)
output :  tensor([[102630.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(9800617., grad_fn=<MseLossBackward>)
output :  tensor([[225231.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1811e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185126.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8518e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177924.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2073150., grad_fn=<MseLossBackward>)
output :  tensor([[82950.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(902603.9375, grad_fn=<MseLossBackward>)
output :  tensor([[128501.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2833, grad_fn=<MseLossBackward>)
output :  tensor([[214400.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(160525.4375, grad_fn=<MseLossBackward>)
output :  tensor([[143123.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(768553.5625, grad_fn=<MseLossBackward>)
output :  tensor([[133045.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(9276879., grad_fn=<MseLossBackward>)
output :  tensor([[146001.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(11571478., grad_fn=<MseLossBackward>)
output :  tensor([[178424.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6748e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145063.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1130367.6250, grad_fn=<MseLossBackward>)
output :  tensor([[160968.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(937326.5000, grad_fn=<MseLossBackward>)
output :  tensor([[211235.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(14168519., grad_fn=<MseLossBackward>)
output :  tensor([[137970.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0870e+09, grad_fn=<MseLossBackward>)
output :  tensor([[255766.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(586995.3750, grad_fn=<MseLossBackward>)
output :  tensor([[161565.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4267194., grad_fn=<MseLossBackward>)
output :  tensor([[130922.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(5869604., grad_fn=<MseLossBackward>)
output :  tensor([[95946.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(896113.6875, grad_fn=<MseLossBackward>)
output :  tensor([[155995.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1116e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179125.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(599801.8750, grad_fn=<MseLossBackward>)
output :  tensor([[121851.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(1827291.3750, grad_fn=<MseLossBackward>)
output :  tensor([[185296.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9056e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145159.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3111e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148841.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1119595.5000, grad_fn=<MseLossBackward>)
output :  tensor([[187196.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(306293.0625, grad_fn=<MseLossBackward>)
output :  tensor([[250789.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7883e+09, grad_fn=<MseLossBackward>)
output :  tensor([[93125.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2642453.5000, grad_fn=<MseLossBackward>)
output :  tensor([[236904.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(9580282., grad_fn=<MseLossBackward>)
output :  tensor([[125736.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(7639393.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165474.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0085e+10, grad_fn=<MseLossBackward>)
output :  tensor([[115140.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2922e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178007.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4028300., grad_fn=<MseLossBackward>)
output :  tensor([[164365.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2326e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155156.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0794e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235485.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(12351051., grad_fn=<MseLossBackward>)
output :  tensor([[225857.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0332e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129356.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5551104., grad_fn=<MseLossBackward>)
output :  tensor([[127743.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3038866., grad_fn=<MseLossBackward>)
output :  tensor([[222170.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(23319996., grad_fn=<MseLossBackward>)
output :  tensor([[228608.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(29067092., grad_fn=<MseLossBackward>)
output :  tensor([[226683.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(272.2500, grad_fn=<MseLossBackward>)
output :  tensor([[150425.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5881004., grad_fn=<MseLossBackward>)
output :  tensor([[209444.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(308493.4688, grad_fn=<MseLossBackward>)
output :  tensor([[132469.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5549e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134563.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4257452., grad_fn=<MseLossBackward>)
output :  tensor([[308157.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(46816812., grad_fn=<MseLossBackward>)
output :  tensor([[140437.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(316371.0938, grad_fn=<MseLossBackward>)
output :  tensor([[119854.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7936e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107218.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(5203638., grad_fn=<MseLossBackward>)
output :  tensor([[154072.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3958e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177788.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3967e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174223.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1495767.2500, grad_fn=<MseLossBackward>)
output :  tensor([[190603.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0808e+08, grad_fn=<MseLossBackward>)
output :  tensor([[102996.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8979480., grad_fn=<MseLossBackward>)
output :  tensor([[176198.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7847527., grad_fn=<MseLossBackward>)
output :  tensor([[175942.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(64680800., grad_fn=<MseLossBackward>)
output :  tensor([[137429.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2465243.5000, grad_fn=<MseLossBackward>)
output :  tensor([[262900.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2543e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141985.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2474e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176485.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(12147730., grad_fn=<MseLossBackward>)
output :  tensor([[135993.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(16049789., grad_fn=<MseLossBackward>)
output :  tensor([[203447.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(8688585., grad_fn=<MseLossBackward>)
output :  tensor([[169134.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(748711.6250, grad_fn=<MseLossBackward>)
output :  tensor([[240092.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(15266480., grad_fn=<MseLossBackward>)
output :  tensor([[133572.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(860836.0625, grad_fn=<MseLossBackward>)
output :  tensor([[152785.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(11805022., grad_fn=<MseLossBackward>)
output :  tensor([[209909.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(25910804., grad_fn=<MseLossBackward>)
output :  tensor([[162616.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5682860., grad_fn=<MseLossBackward>)
output :  tensor([[184795.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(17677032., grad_fn=<MseLossBackward>)
output :  tensor([[134146.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1771e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125988.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(9067250., grad_fn=<MseLossBackward>)
output :  tensor([[142828.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8000058.5000, grad_fn=<MseLossBackward>)
output :  tensor([[199884.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8463e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166563.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6588e+09, grad_fn=<MseLossBackward>)
output :  tensor([[77321.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0004e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93647.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(83683760., grad_fn=<MseLossBackward>)
output :  tensor([[252505.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(619910.1875, grad_fn=<MseLossBackward>)
output :  tensor([[202498.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0321e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114088.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(831644.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158761.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2590e+08, grad_fn=<MseLossBackward>)
output :  tensor([[205330.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1518e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176127.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8120e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156946.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3788254., grad_fn=<MseLossBackward>)
output :  tensor([[168600.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1958906.3750, grad_fn=<MseLossBackward>)
output :  tensor([[116137.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1295008.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164608.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(92326872., grad_fn=<MseLossBackward>)
output :  tensor([[192095.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1918e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222818.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(11010161., grad_fn=<MseLossBackward>)
output :  tensor([[242350.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5266e+11, grad_fn=<MseLossBackward>)
output :  tensor([[142767.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(17915512., grad_fn=<MseLossBackward>)
output :  tensor([[109453.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(948630.3750, grad_fn=<MseLossBackward>)
output :  tensor([[167967.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9410e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153366.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8215210., grad_fn=<MseLossBackward>)
output :  tensor([[233795.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(10266217., grad_fn=<MseLossBackward>)
output :  tensor([[115778.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(605721.6875, grad_fn=<MseLossBackward>)
output :  tensor([[184261.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1853597.1250, grad_fn=<MseLossBackward>)
output :  tensor([[189627.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8568427., grad_fn=<MseLossBackward>)
output :  tensor([[164831.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4077e+10, grad_fn=<MseLossBackward>)
output :  tensor([[95511.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1057e+08, grad_fn=<MseLossBackward>)
output :  tensor([[241012.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4051414.2500, grad_fn=<MseLossBackward>)
output :  tensor([[176762.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(581215.6250, grad_fn=<MseLossBackward>)
output :  tensor([[139930.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4851.9932, grad_fn=<MseLossBackward>)
output :  tensor([[233361.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2684938.2500, grad_fn=<MseLossBackward>)
output :  tensor([[161268.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2998417., grad_fn=<MseLossBackward>)
output :  tensor([[199931.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5642e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134205.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(630758.6250, grad_fn=<MseLossBackward>)
output :  tensor([[184617.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1155e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135406.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(352427.7500, grad_fn=<MseLossBackward>)
output :  tensor([[224165.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4006e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223905.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8094e+08, grad_fn=<MseLossBackward>)
output :  tensor([[89147.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(727115.9375, grad_fn=<MseLossBackward>)
output :  tensor([[161444.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4043932.5000, grad_fn=<MseLossBackward>)
output :  tensor([[244854.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5882e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144736.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(69498.1406, grad_fn=<MseLossBackward>)
output :  tensor([[110348.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8791e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163432.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1139923.2500, grad_fn=<MseLossBackward>)
output :  tensor([[147381.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(11432746., grad_fn=<MseLossBackward>)
output :  tensor([[127083.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1247165.5000, grad_fn=<MseLossBackward>)
output :  tensor([[188591.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9574e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124010.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2280430.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153097.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1204574.8750, grad_fn=<MseLossBackward>)
output :  tensor([[169534.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4910379., grad_fn=<MseLossBackward>)
output :  tensor([[148478.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6356938., grad_fn=<MseLossBackward>)
output :  tensor([[160398.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6256486., grad_fn=<MseLossBackward>)
output :  tensor([[135531.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0393e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134024.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4096639.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156922.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2122e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145843.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2860590.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161430.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(102070.2656, grad_fn=<MseLossBackward>)
output :  tensor([[142444.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0591e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147944.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(732147.6250, grad_fn=<MseLossBackward>)
output :  tensor([[186978.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1043047.3125, grad_fn=<MseLossBackward>)
output :  tensor([[170687.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2846865.2500, grad_fn=<MseLossBackward>)
output :  tensor([[180708.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(502326.5625, grad_fn=<MseLossBackward>)
output :  tensor([[223329.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(11087027., grad_fn=<MseLossBackward>)
output :  tensor([[112217.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(18639862., grad_fn=<MseLossBackward>)
output :  tensor([[139218.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0501e+08, grad_fn=<MseLossBackward>)
output :  tensor([[287982.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3929934.5000, grad_fn=<MseLossBackward>)
output :  tensor([[119904.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(15243290., grad_fn=<MseLossBackward>)
output :  tensor([[176611.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8825e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184873.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(16053.6816, grad_fn=<MseLossBackward>)
output :  tensor([[179774.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(32786002., grad_fn=<MseLossBackward>)
output :  tensor([[250289.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1061e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220965.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1071095.6250, grad_fn=<MseLossBackward>)
output :  tensor([[132101.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8651e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176085.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3295e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126099.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(4409573.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183128.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5358e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151940.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1121580.2500, grad_fn=<MseLossBackward>)
output :  tensor([[154316.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(61092056., grad_fn=<MseLossBackward>)
output :  tensor([[206200.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9856.7666, grad_fn=<MseLossBackward>)
output :  tensor([[144242.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3789e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176689.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(475819.7188, grad_fn=<MseLossBackward>)
output :  tensor([[252100.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5076e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146889.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1232759.1250, grad_fn=<MseLossBackward>)
output :  tensor([[204014.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1822078.1250, grad_fn=<MseLossBackward>)
output :  tensor([[158126.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3325665.2500, grad_fn=<MseLossBackward>)
output :  tensor([[126600.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4900e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136912.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1351442.6250, grad_fn=<MseLossBackward>)
output :  tensor([[186091.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4373784., grad_fn=<MseLossBackward>)
output :  tensor([[194882.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(23836212., grad_fn=<MseLossBackward>)
output :  tensor([[216367.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2755e+09, grad_fn=<MseLossBackward>)
output :  tensor([[256165.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(696494.5625, grad_fn=<MseLossBackward>)
output :  tensor([[182788.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8554e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145253.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8895e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148549.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(16396299., grad_fn=<MseLossBackward>)
output :  tensor([[76947.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3651e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141097.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(37179124., grad_fn=<MseLossBackward>)
output :  tensor([[132066.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(10029592., grad_fn=<MseLossBackward>)
output :  tensor([[154650.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(423617.9375, grad_fn=<MseLossBackward>)
output :  tensor([[123920.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(9483801., grad_fn=<MseLossBackward>)
output :  tensor([[79602.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(9628318., grad_fn=<MseLossBackward>)
output :  tensor([[82511.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(261488.4062, grad_fn=<MseLossBackward>)
output :  tensor([[241431.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(88949952., grad_fn=<MseLossBackward>)
output :  tensor([[139684.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3899e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129858.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(410941.0938, grad_fn=<MseLossBackward>)
output :  tensor([[169653.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(7039155., grad_fn=<MseLossBackward>)
output :  tensor([[233142.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3450538.5000, grad_fn=<MseLossBackward>)
output :  tensor([[185226.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(47799724., grad_fn=<MseLossBackward>)
output :  tensor([[157032.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1065991.7500, grad_fn=<MseLossBackward>)
output :  tensor([[200420.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6351187.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198412.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4890e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133610.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(11491676., grad_fn=<MseLossBackward>)
output :  tensor([[155298.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(89018.3203, grad_fn=<MseLossBackward>)
output :  tensor([[135138.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(741347.9375, grad_fn=<MseLossBackward>)
output :  tensor([[196594.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1159e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150310.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(13612526., grad_fn=<MseLossBackward>)
output :  tensor([[141206.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2759e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144378.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(271783., grad_fn=<MseLossBackward>)
output :  tensor([[210820.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1390999.1250, grad_fn=<MseLossBackward>)
output :  tensor([[106200.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8568e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169374.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3515566.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128304.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(92563.3125, grad_fn=<MseLossBackward>)
output :  tensor([[146095.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(818798.7500, grad_fn=<MseLossBackward>)
output :  tensor([[108154.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0951e+09, grad_fn=<MseLossBackward>)
output :  tensor([[140237.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(7493649.5000, grad_fn=<MseLossBackward>)
output :  tensor([[239896.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(15181738., grad_fn=<MseLossBackward>)
output :  tensor([[143153.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3409331.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141279.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(14284856., grad_fn=<MseLossBackward>)
output :  tensor([[163638.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2701e+09, grad_fn=<MseLossBackward>)
output :  tensor([[265820.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4834e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176776.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3155397., grad_fn=<MseLossBackward>)
output :  tensor([[104494.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(2953484., grad_fn=<MseLossBackward>)
output :  tensor([[197998.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3205e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161446.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5986662., grad_fn=<MseLossBackward>)
output :  tensor([[161356.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6686e+10, grad_fn=<MseLossBackward>)
output :  tensor([[96553.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(3048925.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123973.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(139385.5625, grad_fn=<MseLossBackward>)
output :  tensor([[157023.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1047040.5625, grad_fn=<MseLossBackward>)
output :  tensor([[142110.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4452364., grad_fn=<MseLossBackward>)
output :  tensor([[199933.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4360.1260, grad_fn=<MseLossBackward>)
output :  tensor([[142312.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(97392.7578, grad_fn=<MseLossBackward>)
output :  tensor([[260805.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2174979.7500, grad_fn=<MseLossBackward>)
output :  tensor([[129233.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3129e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164379.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1255205.1250, grad_fn=<MseLossBackward>)
output :  tensor([[188339.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(25730.1641, grad_fn=<MseLossBackward>)
output :  tensor([[121670.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3620e+08, grad_fn=<MseLossBackward>)
output :  tensor([[248840.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1345418.7500, grad_fn=<MseLossBackward>)
output :  tensor([[156381.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3750e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243199.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4623709.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144509.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(259956.5781, grad_fn=<MseLossBackward>)
output :  tensor([[208473.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2330106.7500, grad_fn=<MseLossBackward>)
output :  tensor([[174253.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3435636., grad_fn=<MseLossBackward>)
output :  tensor([[154017.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(300.2639, grad_fn=<MseLossBackward>)
output :  tensor([[120862.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8194622., grad_fn=<MseLossBackward>)
output :  tensor([[235682.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6428e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238043.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3827892.2500, grad_fn=<MseLossBackward>)
output :  tensor([[150616.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7399080., grad_fn=<MseLossBackward>)
output :  tensor([[256771.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3502980.2500, grad_fn=<MseLossBackward>)
output :  tensor([[122566.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(65000380., grad_fn=<MseLossBackward>)
output :  tensor([[178902.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(8421967., grad_fn=<MseLossBackward>)
output :  tensor([[161716.]], grad_fn=<AddmmBackward>)
loss:  tensor(2944656., grad_fn=<MseLossBackward>)
output :  tensor([[136278.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(27865862., grad_fn=<MseLossBackward>)
output :  tensor([[198609.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7762e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166873.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8259517., grad_fn=<MseLossBackward>)
output :  tensor([[163491.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(241556.8906, grad_fn=<MseLossBackward>)
output :  tensor([[157312.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(472162.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145003.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(23972806., grad_fn=<MseLossBackward>)
output :  tensor([[173859.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1421e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159103.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(804412.8125, grad_fn=<MseLossBackward>)
output :  tensor([[372671.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2765e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124356.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(6986646.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127830.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7919e+09, grad_fn=<MseLossBackward>)
output :  tensor([[278566.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7003300.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165980.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(15840898., grad_fn=<MseLossBackward>)
output :  tensor([[131860.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2905e+08, grad_fn=<MseLossBackward>)
output :  tensor([[230285.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2938760.2500, grad_fn=<MseLossBackward>)
output :  tensor([[176901.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(12946616., grad_fn=<MseLossBackward>)
output :  tensor([[151697.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(91411.7422, grad_fn=<MseLossBackward>)
output :  tensor([[144483.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(267014.4062, grad_fn=<MseLossBackward>)
output :  tensor([[155853.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5925e+08, grad_fn=<MseLossBackward>)
output :  tensor([[100489.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(239809.1562, grad_fn=<MseLossBackward>)
output :  tensor([[80204.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0823e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166317.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1734818.2500, grad_fn=<MseLossBackward>)
output :  tensor([[185670.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7918e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156905.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1197246.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153972.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(12441493., grad_fn=<MseLossBackward>)
output :  tensor([[136390.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1122672.7500, grad_fn=<MseLossBackward>)
output :  tensor([[210603.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(21652590., grad_fn=<MseLossBackward>)
output :  tensor([[138593.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(352260.8125, grad_fn=<MseLossBackward>)
output :  tensor([[180093.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6876e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145915.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(7121.7773, grad_fn=<MseLossBackward>)
output :  tensor([[111191.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9476e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94786.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(618938.6875, grad_fn=<MseLossBackward>)
output :  tensor([[174762.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(56517.6328, grad_fn=<MseLossBackward>)
output :  tensor([[260866.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(217563.9375, grad_fn=<MseLossBackward>)
output :  tensor([[142365.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(748603.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161177.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1644245.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132135.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(132734.9844, grad_fn=<MseLossBackward>)
output :  tensor([[148469.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1061254.1250, grad_fn=<MseLossBackward>)
output :  tensor([[171240.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(11160819., grad_fn=<MseLossBackward>)
output :  tensor([[128220.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1490497.6250, grad_fn=<MseLossBackward>)
output :  tensor([[175300.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1814e+08, grad_fn=<MseLossBackward>)
output :  tensor([[159301.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5296255., grad_fn=<MseLossBackward>)
output :  tensor([[116837.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(114117.2812, grad_fn=<MseLossBackward>)
output :  tensor([[163255.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8642e+09, grad_fn=<MseLossBackward>)
output :  tensor([[52181.5430]], grad_fn=<AddmmBackward>)
loss:  tensor(32957.8477, grad_fn=<MseLossBackward>)
output :  tensor([[231385.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5796e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200227.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(596876.9375, grad_fn=<MseLossBackward>)
output :  tensor([[185941.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(885745.6875, grad_fn=<MseLossBackward>)
output :  tensor([[106452.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(205152.3750, grad_fn=<MseLossBackward>)
output :  tensor([[90295.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(10862380., grad_fn=<MseLossBackward>)
output :  tensor([[140636.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(404655., grad_fn=<MseLossBackward>)
output :  tensor([[218684.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6724e+09, grad_fn=<MseLossBackward>)
output :  tensor([[198034.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(89586816., grad_fn=<MseLossBackward>)
output :  tensor([[173889.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(79019600., grad_fn=<MseLossBackward>)
output :  tensor([[172277.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5975e+09, grad_fn=<MseLossBackward>)
output :  tensor([[187646.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5537050., grad_fn=<MseLossBackward>)
output :  tensor([[88994.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(3978996.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139493.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(256858.9062, grad_fn=<MseLossBackward>)
output :  tensor([[110802.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(91303.1172, grad_fn=<MseLossBackward>)
output :  tensor([[149281.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7746e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171847.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6685e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194526.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0969e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179394.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(366176.2500, grad_fn=<MseLossBackward>)
output :  tensor([[96924.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(180498.8438, grad_fn=<MseLossBackward>)
output :  tensor([[119517.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(4071157.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159740.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8850e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199319.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(462676.2812, grad_fn=<MseLossBackward>)
output :  tensor([[146027.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4109109., grad_fn=<MseLossBackward>)
train_loss: [2.6575107e+09]
epoch_result tensor([0.])
output :  tensor([[159441.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(885716.2500, grad_fn=<MseLossBackward>)
output :  tensor([[121084.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(838197.5000, grad_fn=<MseLossBackward>)
output :  tensor([[193829.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(138116.7500, grad_fn=<MseLossBackward>)
output :  tensor([[178847.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3414064.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153991.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7641e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126620.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1903278.8750, grad_fn=<MseLossBackward>)
output :  tensor([[140563.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(190695.9688, grad_fn=<MseLossBackward>)
output :  tensor([[118363.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(405062.6250, grad_fn=<MseLossBackward>)
output :  tensor([[69594.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2309e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165394.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(366876.2812, grad_fn=<MseLossBackward>)
output :  tensor([[141396.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1949339.5000, grad_fn=<MseLossBackward>)
output :  tensor([[225068.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4720.1191, grad_fn=<MseLossBackward>)
output :  tensor([[168027.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(945513.1250, grad_fn=<MseLossBackward>)
output :  tensor([[247996.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2901167., grad_fn=<MseLossBackward>)
output :  tensor([[58128.1133]], grad_fn=<AddmmBackward>)
loss:  tensor(9785093., grad_fn=<MseLossBackward>)
output :  tensor([[161571.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9143e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172288.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7353079.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160013.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(12343145., grad_fn=<MseLossBackward>)
output :  tensor([[274913.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(7466.0400, grad_fn=<MseLossBackward>)
output :  tensor([[193825.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(10075169., grad_fn=<MseLossBackward>)
output :  tensor([[136001.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6451e+10, grad_fn=<MseLossBackward>)
output :  tensor([[192610.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1608497.7500, grad_fn=<MseLossBackward>)
output :  tensor([[177021.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2924e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152939.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3762266.2500, grad_fn=<MseLossBackward>)
output :  tensor([[174195.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(17605630., grad_fn=<MseLossBackward>)
output :  tensor([[88485.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(9519153., grad_fn=<MseLossBackward>)
output :  tensor([[166860.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9009e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183280.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2956196.7500, grad_fn=<MseLossBackward>)
output :  tensor([[205598.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4902e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111651.]], grad_fn=<AddmmBackward>)
loss:  tensor(2725801., grad_fn=<MseLossBackward>)
output :  tensor([[173248.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5053785., grad_fn=<MseLossBackward>)
output :  tensor([[137791.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1668254.7500, grad_fn=<MseLossBackward>)
output :  tensor([[130253.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1570557.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123430.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(15445084., grad_fn=<MseLossBackward>)
output :  tensor([[148612.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9933e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169236.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1247e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147972.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2983338.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179512.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(237503.9375, grad_fn=<MseLossBackward>)
output :  tensor([[144078.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9474276., grad_fn=<MseLossBackward>)
output :  tensor([[106172.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6154e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136358.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1845e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134896.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(10790.0156, grad_fn=<MseLossBackward>)
output :  tensor([[129584.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(6679923., grad_fn=<MseLossBackward>)
output :  tensor([[226719.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2957325., grad_fn=<MseLossBackward>)
output :  tensor([[130545.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2903669.2500, grad_fn=<MseLossBackward>)
output :  tensor([[150768.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3127371.2500, grad_fn=<MseLossBackward>)
output :  tensor([[113479.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(2187556.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162343.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5489868.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147532.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2532e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195419.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(11692232., grad_fn=<MseLossBackward>)
output :  tensor([[136511.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4251457.5000, grad_fn=<MseLossBackward>)
output :  tensor([[102815.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(51615020., grad_fn=<MseLossBackward>)
output :  tensor([[234307.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(94796.6406, grad_fn=<MseLossBackward>)
output :  tensor([[164889.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3620e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166186.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(51645332., grad_fn=<MseLossBackward>)
output :  tensor([[203544.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8546e+10, grad_fn=<MseLossBackward>)
output :  tensor([[241642.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2624e+10, grad_fn=<MseLossBackward>)
output :  tensor([[148388.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(23895140., grad_fn=<MseLossBackward>)
output :  tensor([[133153.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(716482.8750, grad_fn=<MseLossBackward>)
output :  tensor([[153236.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3110152.7500, grad_fn=<MseLossBackward>)
output :  tensor([[131774.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3147242.2500, grad_fn=<MseLossBackward>)
output :  tensor([[183912.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7893e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182147.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3812927.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165276.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(14259946., grad_fn=<MseLossBackward>)
output :  tensor([[143208.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(43348.5430, grad_fn=<MseLossBackward>)
output :  tensor([[144501.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4007941.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144532.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(218307.9688, grad_fn=<MseLossBackward>)
output :  tensor([[171904.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5943e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193224.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6526e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138635.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4558759., grad_fn=<MseLossBackward>)
output :  tensor([[169526.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5632612., grad_fn=<MseLossBackward>)
output :  tensor([[178950.]], grad_fn=<AddmmBackward>)
loss:  tensor(4202500., grad_fn=<MseLossBackward>)
output :  tensor([[118123.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(9756740., grad_fn=<MseLossBackward>)
output :  tensor([[218008.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8950475., grad_fn=<MseLossBackward>)
output :  tensor([[182480.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1040081.2500, grad_fn=<MseLossBackward>)
output :  tensor([[126467.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(935905.0625, grad_fn=<MseLossBackward>)
output :  tensor([[197325.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(681940.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180813.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(34971700., grad_fn=<MseLossBackward>)
output :  tensor([[206386.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2351e+10, grad_fn=<MseLossBackward>)
output :  tensor([[210069.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(865394.1250, grad_fn=<MseLossBackward>)
output :  tensor([[169839.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5085e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195715.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1477364.2500, grad_fn=<MseLossBackward>)
output :  tensor([[111045.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(3819123.5000, grad_fn=<MseLossBackward>)
output :  tensor([[115060.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6556000., grad_fn=<MseLossBackward>)
output :  tensor([[114433.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(5919983., grad_fn=<MseLossBackward>)
output :  tensor([[148497.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2880233.2500, grad_fn=<MseLossBackward>)
output :  tensor([[159476.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3550e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178270.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2989765.2500, grad_fn=<MseLossBackward>)
output :  tensor([[127460.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1573.8577, grad_fn=<MseLossBackward>)
output :  tensor([[142951.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4195840., grad_fn=<MseLossBackward>)
output :  tensor([[182598.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2751e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120141.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(10507424., grad_fn=<MseLossBackward>)
output :  tensor([[189414.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(57532464., grad_fn=<MseLossBackward>)
output :  tensor([[144592.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(166081.7188, grad_fn=<MseLossBackward>)
output :  tensor([[209906.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(8963100., grad_fn=<MseLossBackward>)
output :  tensor([[128511.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(6306102., grad_fn=<MseLossBackward>)
output :  tensor([[247132.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1428585.2500, grad_fn=<MseLossBackward>)
output :  tensor([[235825.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4182e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150074.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4873e+08, grad_fn=<MseLossBackward>)
output :  tensor([[87281.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9071e+08, grad_fn=<MseLossBackward>)
output :  tensor([[191365.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9781e+09, grad_fn=<MseLossBackward>)
output :  tensor([[81647.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(419559.8125, grad_fn=<MseLossBackward>)
output :  tensor([[138616.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(781400.7500, grad_fn=<MseLossBackward>)
output :  tensor([[79442.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(15542998., grad_fn=<MseLossBackward>)
output :  tensor([[145507.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6526508., grad_fn=<MseLossBackward>)
output :  tensor([[176750.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(563883.6875, grad_fn=<MseLossBackward>)
output :  tensor([[152009.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2222708.2500, grad_fn=<MseLossBackward>)
output :  tensor([[109455.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4225979.5000, grad_fn=<MseLossBackward>)
output :  tensor([[205749.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2100e+10, grad_fn=<MseLossBackward>)
output :  tensor([[130331.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(3352646.7500, grad_fn=<MseLossBackward>)
output :  tensor([[268002.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4393e+08, grad_fn=<MseLossBackward>)
output :  tensor([[306896.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(9630742., grad_fn=<MseLossBackward>)
output :  tensor([[110236.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7490741.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171969.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(281745.3125, grad_fn=<MseLossBackward>)
output :  tensor([[134395.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9671e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145419.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(41213992., grad_fn=<MseLossBackward>)
output :  tensor([[130695.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(198546.8281, grad_fn=<MseLossBackward>)
output :  tensor([[127755.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(7591962., grad_fn=<MseLossBackward>)
output :  tensor([[136105.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0783e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227166.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8351e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186668.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3818e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142057.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3396073., grad_fn=<MseLossBackward>)
output :  tensor([[128858.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(1845713.2500, grad_fn=<MseLossBackward>)
output :  tensor([[111866.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(380496.2188, grad_fn=<MseLossBackward>)
output :  tensor([[252960.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2381e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135396.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(157212.2500, grad_fn=<MseLossBackward>)
output :  tensor([[197972.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(25276856., grad_fn=<MseLossBackward>)
output :  tensor([[102812.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(4358798., grad_fn=<MseLossBackward>)
output :  tensor([[139723.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(51493.5391, grad_fn=<MseLossBackward>)
output :  tensor([[207398.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9246e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173252.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(44185308., grad_fn=<MseLossBackward>)
output :  tensor([[187438.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5945977.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162904.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1344e+10, grad_fn=<MseLossBackward>)
output :  tensor([[293720.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7040e+09, grad_fn=<MseLossBackward>)
output :  tensor([[198339.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(193352.5781, grad_fn=<MseLossBackward>)
output :  tensor([[260862.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0163e+10, grad_fn=<MseLossBackward>)
output :  tensor([[214142.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6892e+09, grad_fn=<MseLossBackward>)
output :  tensor([[275229.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7447e+09, grad_fn=<MseLossBackward>)
output :  tensor([[227346.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(11201572., grad_fn=<MseLossBackward>)
output :  tensor([[221340.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9125e+10, grad_fn=<MseLossBackward>)
output :  tensor([[199436.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5937979., grad_fn=<MseLossBackward>)
output :  tensor([[160899.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0176e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134261.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3102276.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135422.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5943.4463, grad_fn=<MseLossBackward>)
output :  tensor([[90743.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(65972.7266, grad_fn=<MseLossBackward>)
output :  tensor([[105512.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(6188628., grad_fn=<MseLossBackward>)
output :  tensor([[272487.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1823e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237773.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(7689702.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145999.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(998563., grad_fn=<MseLossBackward>)
output :  tensor([[141325.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(14635168., grad_fn=<MseLossBackward>)
output :  tensor([[170491.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(10504993., grad_fn=<MseLossBackward>)
output :  tensor([[145719.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(220092.9219, grad_fn=<MseLossBackward>)
output :  tensor([[164069.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2600e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163530.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2159751.7500, grad_fn=<MseLossBackward>)
output :  tensor([[136644.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(126169.2578, grad_fn=<MseLossBackward>)
output :  tensor([[190134.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5744e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114320.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5386968.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175220.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(10370614., grad_fn=<MseLossBackward>)
output :  tensor([[118184.]], grad_fn=<AddmmBackward>)
loss:  tensor(3297856., grad_fn=<MseLossBackward>)
output :  tensor([[88080.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(1167666., grad_fn=<MseLossBackward>)
output :  tensor([[180387.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(150241.0312, grad_fn=<MseLossBackward>)
output :  tensor([[110143.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(59200.9727, grad_fn=<MseLossBackward>)
output :  tensor([[240537.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2364771.2500, grad_fn=<MseLossBackward>)
output :  tensor([[244889.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(12144.7285, grad_fn=<MseLossBackward>)
output :  tensor([[130026.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(276749.9688, grad_fn=<MseLossBackward>)
output :  tensor([[113247.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(18392572., grad_fn=<MseLossBackward>)
output :  tensor([[286572.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2675e+10, grad_fn=<MseLossBackward>)
output :  tensor([[173362.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3468673.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126058.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(1119711.1250, grad_fn=<MseLossBackward>)
output :  tensor([[145001.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2906e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198454.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4167e+08, grad_fn=<MseLossBackward>)
output :  tensor([[143440.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5957413., grad_fn=<MseLossBackward>)
output :  tensor([[157780.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4938e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157529.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(13174518., grad_fn=<MseLossBackward>)
output :  tensor([[130195.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(483361.6875, grad_fn=<MseLossBackward>)
output :  tensor([[245480.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7694e+10, grad_fn=<MseLossBackward>)
output :  tensor([[398441.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(12666259., grad_fn=<MseLossBackward>)
output :  tensor([[100668.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(69410504., grad_fn=<MseLossBackward>)
output :  tensor([[116979.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(2313037., grad_fn=<MseLossBackward>)
output :  tensor([[157840.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2755392.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133739.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1047e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161884.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6139e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173414.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0214e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105392.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3213504.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135123.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(34536556., grad_fn=<MseLossBackward>)
output :  tensor([[368853.]], grad_fn=<AddmmBackward>)
loss:  tensor(2430481., grad_fn=<MseLossBackward>)
output :  tensor([[202044.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6994e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174172.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1761717., grad_fn=<MseLossBackward>)
output :  tensor([[201214.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2840963., grad_fn=<MseLossBackward>)
output :  tensor([[139244.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(59680.9648, grad_fn=<MseLossBackward>)
output :  tensor([[192734.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3117045.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134613.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3515e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177157.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(14765527., grad_fn=<MseLossBackward>)
output :  tensor([[238514.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(12151869., grad_fn=<MseLossBackward>)
output :  tensor([[174468.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(219902.3750, grad_fn=<MseLossBackward>)
output :  tensor([[106804.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1429108.1250, grad_fn=<MseLossBackward>)
output :  tensor([[264425.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(18368.7188, grad_fn=<MseLossBackward>)
output :  tensor([[248747.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1569030.2500, grad_fn=<MseLossBackward>)
output :  tensor([[117780.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(27239756., grad_fn=<MseLossBackward>)
output :  tensor([[210759.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1269e+09, grad_fn=<MseLossBackward>)
output :  tensor([[304377.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3773e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208861.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3464135.2500, grad_fn=<MseLossBackward>)
output :  tensor([[213060.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6114e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159675.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3150680.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169710.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(78102.7812, grad_fn=<MseLossBackward>)
output :  tensor([[163311.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(40700212., grad_fn=<MseLossBackward>)
output :  tensor([[169662.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(113969.5391, grad_fn=<MseLossBackward>)
output :  tensor([[235158.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0786e+09, grad_fn=<MseLossBackward>)
output :  tensor([[213882.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4253e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161869.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2109e+08, grad_fn=<MseLossBackward>)
output :  tensor([[120002.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(8984163., grad_fn=<MseLossBackward>)
output :  tensor([[176628.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(137826.5625, grad_fn=<MseLossBackward>)
output :  tensor([[178558.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6327e+09, grad_fn=<MseLossBackward>)
output :  tensor([[204745.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6051e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134922.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(240498.2969, grad_fn=<MseLossBackward>)
output :  tensor([[153736.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0327e+09, grad_fn=<MseLossBackward>)
output :  tensor([[279226.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4957024., grad_fn=<MseLossBackward>)
output :  tensor([[85905.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(820453.8125, grad_fn=<MseLossBackward>)
output :  tensor([[235209.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1664382.2500, grad_fn=<MseLossBackward>)
output :  tensor([[256284.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0670e+11, grad_fn=<MseLossBackward>)
output :  tensor([[168904.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1199709.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191787.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8673e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153336.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2765828.7500, grad_fn=<MseLossBackward>)
output :  tensor([[205613.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1456e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129827.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(684704.5625, grad_fn=<MseLossBackward>)
output :  tensor([[146688.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2850135.2500, grad_fn=<MseLossBackward>)
output :  tensor([[171774.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5697e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187312.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2140186.2500, grad_fn=<MseLossBackward>)
output :  tensor([[131880.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(34574768., grad_fn=<MseLossBackward>)
output :  tensor([[138284.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3185109.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176468.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(12030709., grad_fn=<MseLossBackward>)
output :  tensor([[200701.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4303e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239915.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(9516454., grad_fn=<MseLossBackward>)
output :  tensor([[153920.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1165387.7500, grad_fn=<MseLossBackward>)
output :  tensor([[197328.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1765908.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164118.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0474e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175497.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(16020507., grad_fn=<MseLossBackward>)
output :  tensor([[179534.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(133875.9531, grad_fn=<MseLossBackward>)
output :  tensor([[97858.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(737075.9375, grad_fn=<MseLossBackward>)
output :  tensor([[172245.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1611e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132976.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4094489., grad_fn=<MseLossBackward>)
output :  tensor([[120339.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(28506256., grad_fn=<MseLossBackward>)
output :  tensor([[174842.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(709148.1875, grad_fn=<MseLossBackward>)
output :  tensor([[87363.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(5586538.5000, grad_fn=<MseLossBackward>)
output :  tensor([[283316.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(44666248., grad_fn=<MseLossBackward>)
output :  tensor([[164142.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(735091.8750, grad_fn=<MseLossBackward>)
output :  tensor([[192720.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9726e+10, grad_fn=<MseLossBackward>)
output :  tensor([[241871.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4848e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151210.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(44218.2031, grad_fn=<MseLossBackward>)
output :  tensor([[123310.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(475065.5625, grad_fn=<MseLossBackward>)
output :  tensor([[118122.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(3158256.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145975.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5949e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171749.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5066790., grad_fn=<MseLossBackward>)
output :  tensor([[111558.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4441e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207791.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2146e+10, grad_fn=<MseLossBackward>)
output :  tensor([[236895.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(21197680., grad_fn=<MseLossBackward>)
output :  tensor([[249006.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1370e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222438.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7427e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195095.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4497e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188368.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(754970.9375, grad_fn=<MseLossBackward>)
output :  tensor([[205628.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8067e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188151.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1859e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178581.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(25276.0312, grad_fn=<MseLossBackward>)
output :  tensor([[154008.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4032691.5000, grad_fn=<MseLossBackward>)
output :  tensor([[337118.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(14012.6406, grad_fn=<MseLossBackward>)
output :  tensor([[211612.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(150459.1406, grad_fn=<MseLossBackward>)
output :  tensor([[161615.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2609991.7500, grad_fn=<MseLossBackward>)
output :  tensor([[184864.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2075e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108213.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(10324574., grad_fn=<MseLossBackward>)
output :  tensor([[271577.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0328e+10, grad_fn=<MseLossBackward>)
output :  tensor([[173727.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(29648.5352, grad_fn=<MseLossBackward>)
output :  tensor([[211730.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3131240.7500, grad_fn=<MseLossBackward>)
output :  tensor([[205104.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5267e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178970.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(52734.8164, grad_fn=<MseLossBackward>)
output :  tensor([[202806.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1013828.7500, grad_fn=<MseLossBackward>)
output :  tensor([[156954.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3818604.5000, grad_fn=<MseLossBackward>)
output :  tensor([[149878.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4879e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120248.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(3056350.7500, grad_fn=<MseLossBackward>)
output :  tensor([[139598.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(160963.9531, grad_fn=<MseLossBackward>)
output :  tensor([[147799.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1440712.6250, grad_fn=<MseLossBackward>)
output :  tensor([[200541.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6246e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160928.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2041371.2500, grad_fn=<MseLossBackward>)
output :  tensor([[101730.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(4977047.5000, grad_fn=<MseLossBackward>)
output :  tensor([[223591.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6923e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188243.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1727e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175695.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(624050.6250, grad_fn=<MseLossBackward>)
output :  tensor([[81844.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(24146.2461, grad_fn=<MseLossBackward>)
output :  tensor([[129412.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(831972., grad_fn=<MseLossBackward>)
output :  tensor([[216621.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(6870214.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143903.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9390.8213, grad_fn=<MseLossBackward>)
output :  tensor([[127915.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(4344065.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146188.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(12877220., grad_fn=<MseLossBackward>)
output :  tensor([[179712.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7819e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146756.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(7599412., grad_fn=<MseLossBackward>)
output :  tensor([[158532.]], grad_fn=<AddmmBackward>)
loss:  tensor(2155024., grad_fn=<MseLossBackward>)
output :  tensor([[213834.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1357989.6250, grad_fn=<MseLossBackward>)
output :  tensor([[138580.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1277e+09, grad_fn=<MseLossBackward>)
output :  tensor([[259356.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(18975144., grad_fn=<MseLossBackward>)
output :  tensor([[155964.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(12502633., grad_fn=<MseLossBackward>)
output :  tensor([[126731.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3128642.5000, grad_fn=<MseLossBackward>)
output :  tensor([[96863.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3474437.7500, grad_fn=<MseLossBackward>)
output :  tensor([[152498.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6238e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180412.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(262976.6562, grad_fn=<MseLossBackward>)
output :  tensor([[118931.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2459653., grad_fn=<MseLossBackward>)
output :  tensor([[186734.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7822e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145514.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3579e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149627.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(74452.2422, grad_fn=<MseLossBackward>)
output :  tensor([[187669.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6405.0010, grad_fn=<MseLossBackward>)
output :  tensor([[250287.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8310e+09, grad_fn=<MseLossBackward>)
output :  tensor([[92239.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(546236.5000, grad_fn=<MseLossBackward>)
output :  tensor([[233287.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(45053880., grad_fn=<MseLossBackward>)
output :  tensor([[128948.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(200991.1094, grad_fn=<MseLossBackward>)
output :  tensor([[166779.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8248e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116459.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7091e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176072.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5283.4727, grad_fn=<MseLossBackward>)
output :  tensor([[166784.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4992e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157408.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2408e+08, grad_fn=<MseLossBackward>)
output :  tensor([[240851.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3429499., grad_fn=<MseLossBackward>)
output :  tensor([[227495.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3050e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129149.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(4619913.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125376.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(389298., grad_fn=<MseLossBackward>)
output :  tensor([[223596.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(11580834., grad_fn=<MseLossBackward>)
output :  tensor([[229896.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(16840508., grad_fn=<MseLossBackward>)
output :  tensor([[229479.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(7723536., grad_fn=<MseLossBackward>)
output :  tensor([[148835.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(698347.5000, grad_fn=<MseLossBackward>)
output :  tensor([[213497.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(12235676., grad_fn=<MseLossBackward>)
output :  tensor([[132805.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6397e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134534.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4139063., grad_fn=<MseLossBackward>)
output :  tensor([[308904.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(37152072., grad_fn=<MseLossBackward>)
output :  tensor([[146691.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(32397442., grad_fn=<MseLossBackward>)
output :  tensor([[120030.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8123e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111101.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2566304., grad_fn=<MseLossBackward>)
output :  tensor([[155598.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8565e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179938.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9845e+09, grad_fn=<MseLossBackward>)
output :  tensor([[170433.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6587002.5000, grad_fn=<MseLossBackward>)
output :  tensor([[190107.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1864e+08, grad_fn=<MseLossBackward>)
output :  tensor([[95043.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(24571152., grad_fn=<MseLossBackward>)
output :  tensor([[178098.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(812026.2500, grad_fn=<MseLossBackward>)
output :  tensor([[168217.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(100984.9219, grad_fn=<MseLossBackward>)
output :  tensor([[138243.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(572694.1875, grad_fn=<MseLossBackward>)
output :  tensor([[259121.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9957e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143836.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4617e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175647.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7011242., grad_fn=<MseLossBackward>)
output :  tensor([[140626.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(393031.0312, grad_fn=<MseLossBackward>)
output :  tensor([[192530.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(63508944., grad_fn=<MseLossBackward>)
output :  tensor([[167930.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4284188.5000, grad_fn=<MseLossBackward>)
output :  tensor([[241969.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4122422.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135641.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1302843.8750, grad_fn=<MseLossBackward>)
output :  tensor([[150928.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2491366.2500, grad_fn=<MseLossBackward>)
output :  tensor([[214535.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(215934.4688, grad_fn=<MseLossBackward>)
output :  tensor([[165837.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(701798.8750, grad_fn=<MseLossBackward>)
output :  tensor([[188247.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(566279.7500, grad_fn=<MseLossBackward>)
output :  tensor([[133349.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5795e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129061.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3801.4932, grad_fn=<MseLossBackward>)
output :  tensor([[137808.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4801713.5000, grad_fn=<MseLossBackward>)
output :  tensor([[197798.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1411e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166108.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6121e+09, grad_fn=<MseLossBackward>)
output :  tensor([[79330.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7365e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93842.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(87288440., grad_fn=<MseLossBackward>)
output :  tensor([[257531.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(17965942., grad_fn=<MseLossBackward>)
output :  tensor([[202605.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0457e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115388.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(150944.3906, grad_fn=<MseLossBackward>)
output :  tensor([[158002.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7011e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207711.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5100e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178857.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3069e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157899.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(8408369., grad_fn=<MseLossBackward>)
output :  tensor([[167725.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5173634.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117588.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6698876.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165835.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1742e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194334.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5789e+08, grad_fn=<MseLossBackward>)
output :  tensor([[218473.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1054023., grad_fn=<MseLossBackward>)
output :  tensor([[246271.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4873e+11, grad_fn=<MseLossBackward>)
output :  tensor([[148152.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1327464., grad_fn=<MseLossBackward>)
output :  tensor([[107007.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2167428., grad_fn=<MseLossBackward>)
output :  tensor([[170715.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2509e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147988.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6307397., grad_fn=<MseLossBackward>)
output :  tensor([[237999.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(999312.6250, grad_fn=<MseLossBackward>)
output :  tensor([[114816.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(33766.9336, grad_fn=<MseLossBackward>)
output :  tensor([[179170.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(13912084., grad_fn=<MseLossBackward>)
output :  tensor([[187224.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(274625.1250, grad_fn=<MseLossBackward>)
output :  tensor([[162769.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4721e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97202.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6252e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238043.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(915639.6875, grad_fn=<MseLossBackward>)
output :  tensor([[177300.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1692316.3750, grad_fn=<MseLossBackward>)
output :  tensor([[139370.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(396683.4688, grad_fn=<MseLossBackward>)
output :  tensor([[236824.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3327660., grad_fn=<MseLossBackward>)
output :  tensor([[163942.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(889042.7500, grad_fn=<MseLossBackward>)
output :  tensor([[200998.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5376e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134724.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(75840., grad_fn=<MseLossBackward>)
output :  tensor([[186060.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7892e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137353.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1830651.2500, grad_fn=<MseLossBackward>)
output :  tensor([[223755.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4994e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224668.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4169e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91785.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(3187591.7500, grad_fn=<MseLossBackward>)
output :  tensor([[159876.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(195391.6250, grad_fn=<MseLossBackward>)
output :  tensor([[241804.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6660e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149143.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(17164578., grad_fn=<MseLossBackward>)
output :  tensor([[110833.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9214e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164089.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(168728.4062, grad_fn=<MseLossBackward>)
output :  tensor([[144711.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(505543.2188, grad_fn=<MseLossBackward>)
output :  tensor([[130667.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6086397.5000, grad_fn=<MseLossBackward>)
output :  tensor([[190862.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6427e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124715.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4910587., grad_fn=<MseLossBackward>)
output :  tensor([[148374.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(13145383., grad_fn=<MseLossBackward>)
output :  tensor([[169574.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4732392.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152199.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1439062.6250, grad_fn=<MseLossBackward>)
output :  tensor([[158949.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(15609166., grad_fn=<MseLossBackward>)
output :  tensor([[136031.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3068e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133996.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3984577.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155911.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8601e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145352.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1441012.6250, grad_fn=<MseLossBackward>)
output :  tensor([[161189.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(314247.8438, grad_fn=<MseLossBackward>)
output :  tensor([[143051.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0990e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147626.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1378129.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188815.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(664963.8125, grad_fn=<MseLossBackward>)
output :  tensor([[169417.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(174397.5938, grad_fn=<MseLossBackward>)
output :  tensor([[179459.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(291988.2500, grad_fn=<MseLossBackward>)
output :  tensor([[218148.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3427936.5000, grad_fn=<MseLossBackward>)
output :  tensor([[113370.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(29925772., grad_fn=<MseLossBackward>)
output :  tensor([[136741.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4022e+08, grad_fn=<MseLossBackward>)
output :  tensor([[281109.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(23921576., grad_fn=<MseLossBackward>)
output :  tensor([[118976.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(8861180., grad_fn=<MseLossBackward>)
output :  tensor([[177502.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8060e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184836.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(26762.9141, grad_fn=<MseLossBackward>)
output :  tensor([[192030.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(42653348., grad_fn=<MseLossBackward>)
output :  tensor([[251227.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6512e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223009.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1019121.8125, grad_fn=<MseLossBackward>)
output :  tensor([[131908.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7642e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176450.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4991e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122868.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(1280027.1250, grad_fn=<MseLossBackward>)
output :  tensor([[182810.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5520e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159131.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(37594144., grad_fn=<MseLossBackward>)
output :  tensor([[156272.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(95493208., grad_fn=<MseLossBackward>)
output :  tensor([[204686.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2603735.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143828.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2834e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174508.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2225831., grad_fn=<MseLossBackward>)
output :  tensor([[250494.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4133e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148414.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(171421.8750, grad_fn=<MseLossBackward>)
output :  tensor([[198912.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(14084774., grad_fn=<MseLossBackward>)
output :  tensor([[164160.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(17724494., grad_fn=<MseLossBackward>)
output :  tensor([[125598.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4136e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133590.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4665532.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180335.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(13426270., grad_fn=<MseLossBackward>)
output :  tensor([[195351.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(28635876., grad_fn=<MseLossBackward>)
output :  tensor([[222065.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4802e+09, grad_fn=<MseLossBackward>)
output :  tensor([[256300.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(489322.1250, grad_fn=<MseLossBackward>)
output :  tensor([[180824.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9092e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144770.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8377e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142126.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5632909., grad_fn=<MseLossBackward>)
output :  tensor([[73863.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1467e+09, grad_fn=<MseLossBackward>)
output :  tensor([[131052.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(15583990., grad_fn=<MseLossBackward>)
output :  tensor([[130273.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(1887511., grad_fn=<MseLossBackward>)
output :  tensor([[154506.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(256843.0781, grad_fn=<MseLossBackward>)
output :  tensor([[128953.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(3816864.2500, grad_fn=<MseLossBackward>)
output :  tensor([[78750.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5063765.5000, grad_fn=<MseLossBackward>)
output :  tensor([[82897.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(805394.0625, grad_fn=<MseLossBackward>)
output :  tensor([[227275.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(22320162., grad_fn=<MseLossBackward>)
output :  tensor([[141667.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5076e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135728.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(27337048., grad_fn=<MseLossBackward>)
output :  tensor([[165195.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3254641.5000, grad_fn=<MseLossBackward>)
output :  tensor([[232886.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4465693.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191212.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(860604.1250, grad_fn=<MseLossBackward>)
output :  tensor([[156742.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(551236.6250, grad_fn=<MseLossBackward>)
output :  tensor([[195680.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4926041.5000, grad_fn=<MseLossBackward>)
output :  tensor([[197816.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5353e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136648.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(123629.1562, grad_fn=<MseLossBackward>)
output :  tensor([[153818.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1396237.6250, grad_fn=<MseLossBackward>)
output :  tensor([[136191.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(36798.0312, grad_fn=<MseLossBackward>)
output :  tensor([[197994.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0243e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154820.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(672707.5625, grad_fn=<MseLossBackward>)
output :  tensor([[138391.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0152e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144980.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6548.3496, grad_fn=<MseLossBackward>)
output :  tensor([[209625.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5637582.5000, grad_fn=<MseLossBackward>)
output :  tensor([[104633.]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1225e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168523.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1047136.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126945.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(1112118.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147685.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(469824.5625, grad_fn=<MseLossBackward>)
output :  tensor([[107962.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0775e+09, grad_fn=<MseLossBackward>)
output :  tensor([[140310.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7900403.5000, grad_fn=<MseLossBackward>)
output :  tensor([[235821.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(31979.4980, grad_fn=<MseLossBackward>)
output :  tensor([[146037.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1076892.6250, grad_fn=<MseLossBackward>)
output :  tensor([[138716.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1479036., grad_fn=<MseLossBackward>)
output :  tensor([[164718.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3482e+09, grad_fn=<MseLossBackward>)
output :  tensor([[265767.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4963e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172790.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4882788., grad_fn=<MseLossBackward>)
output :  tensor([[100740.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(4142465.2500, grad_fn=<MseLossBackward>)
output :  tensor([[200258.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9663e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158455.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(296140.0312, grad_fn=<MseLossBackward>)
output :  tensor([[161560.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6598e+10, grad_fn=<MseLossBackward>)
output :  tensor([[102809.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(20334322., grad_fn=<MseLossBackward>)
output :  tensor([[122819.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(609839., grad_fn=<MseLossBackward>)
output :  tensor([[157044.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1091339.3750, grad_fn=<MseLossBackward>)
output :  tensor([[140724.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(524583.3125, grad_fn=<MseLossBackward>)
output :  tensor([[202637.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6958302., grad_fn=<MseLossBackward>)
output :  tensor([[138301.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(13680289., grad_fn=<MseLossBackward>)
output :  tensor([[265158.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8285402.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128780.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2802e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164181.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1737412.3750, grad_fn=<MseLossBackward>)
output :  tensor([[188743.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(59444.5352, grad_fn=<MseLossBackward>)
output :  tensor([[122583.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5834e+08, grad_fn=<MseLossBackward>)
output :  tensor([[254484.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(20108078., grad_fn=<MseLossBackward>)
output :  tensor([[157350.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7909e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243345.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4016642.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140609.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(11493583., grad_fn=<MseLossBackward>)
output :  tensor([[207231.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7665803.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174092.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2864979.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151881.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4488241., grad_fn=<MseLossBackward>)
output :  tensor([[119699.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(2886680.7500, grad_fn=<MseLossBackward>)
output :  tensor([[236092.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6007e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237492.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(6286929.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152747.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(347676.0625, grad_fn=<MseLossBackward>)
output :  tensor([[253184.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2942243.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123611.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(82950256., grad_fn=<MseLossBackward>)
output :  tensor([[175672.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(107471.2812, grad_fn=<MseLossBackward>)
output :  tensor([[157861.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4574652.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131981.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(963526.3125, grad_fn=<MseLossBackward>)
output :  tensor([[196104.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4362e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164220.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(48737.4609, grad_fn=<MseLossBackward>)
output :  tensor([[165685.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7209812.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157287.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(507522.6562, grad_fn=<MseLossBackward>)
output :  tensor([[153034.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(9825286., grad_fn=<MseLossBackward>)
output :  tensor([[174724.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2543e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159641.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(128600.6875, grad_fn=<MseLossBackward>)
output :  tensor([[376470.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(56247188., grad_fn=<MseLossBackward>)
output :  tensor([[137127.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0256e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129348.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9227e+09, grad_fn=<MseLossBackward>)
output :  tensor([[288621.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(54892356., grad_fn=<MseLossBackward>)
output :  tensor([[162274.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(75255.9219, grad_fn=<MseLossBackward>)
output :  tensor([[132512.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4431e+08, grad_fn=<MseLossBackward>)
output :  tensor([[240693.]], grad_fn=<AddmmBackward>)
loss:  tensor(75568248., grad_fn=<MseLossBackward>)
output :  tensor([[179678.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(675273.0625, grad_fn=<MseLossBackward>)
output :  tensor([[154541.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6460334., grad_fn=<MseLossBackward>)
output :  tensor([[144666.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(111013.9062, grad_fn=<MseLossBackward>)
output :  tensor([[154309.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0308e+08, grad_fn=<MseLossBackward>)
output :  tensor([[98411.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(2523853.5000, grad_fn=<MseLossBackward>)
output :  tensor([[81601.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6663e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163719.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1640480.6250, grad_fn=<MseLossBackward>)
output :  tensor([[188398.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5683e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161287.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(10810225., grad_fn=<MseLossBackward>)
output :  tensor([[160090.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6712066.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136444.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1010244.8750, grad_fn=<MseLossBackward>)
output :  tensor([[205472.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(228185.3438, grad_fn=<MseLossBackward>)
output :  tensor([[139587.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2520999.7500, grad_fn=<MseLossBackward>)
output :  tensor([[181566.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6495e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146813.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(661273.9375, grad_fn=<MseLossBackward>)
output :  tensor([[111315.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0177e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93052.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(897682.2500, grad_fn=<MseLossBackward>)
output :  tensor([[176407.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1981628.1250, grad_fn=<MseLossBackward>)
output :  tensor([[257788.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6821483., grad_fn=<MseLossBackward>)
output :  tensor([[139118.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5673552., grad_fn=<MseLossBackward>)
output :  tensor([[158959.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(875160.2500, grad_fn=<MseLossBackward>)
output :  tensor([[133745.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1551698.3750, grad_fn=<MseLossBackward>)
output :  tensor([[148980.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(269523.2188, grad_fn=<MseLossBackward>)
output :  tensor([[166676.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1497984.7500, grad_fn=<MseLossBackward>)
output :  tensor([[131525.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(20477604., grad_fn=<MseLossBackward>)
output :  tensor([[174577.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7484e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160461.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(11983929., grad_fn=<MseLossBackward>)
output :  tensor([[114022.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6139632., grad_fn=<MseLossBackward>)
output :  tensor([[162146.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0202e+09, grad_fn=<MseLossBackward>)
output :  tensor([[50519.6758]], grad_fn=<AddmmBackward>)
loss:  tensor(2191359.7500, grad_fn=<MseLossBackward>)
output :  tensor([[232419.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4129e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201314.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(98625.4375, grad_fn=<MseLossBackward>)
output :  tensor([[183437.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2442431.7500, grad_fn=<MseLossBackward>)
output :  tensor([[105572.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(182929.9688, grad_fn=<MseLossBackward>)
output :  tensor([[88164.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1354968.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138795.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1451384.8750, grad_fn=<MseLossBackward>)
output :  tensor([[218627.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6810e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199764.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(59839168., grad_fn=<MseLossBackward>)
output :  tensor([[170060.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(25611982., grad_fn=<MseLossBackward>)
output :  tensor([[172476.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5607e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192246.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5045007.5000, grad_fn=<MseLossBackward>)
output :  tensor([[88625.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2643368., grad_fn=<MseLossBackward>)
output :  tensor([[137924.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4309387., grad_fn=<MseLossBackward>)
output :  tensor([[112366.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(3483326.5000, grad_fn=<MseLossBackward>)
output :  tensor([[149444.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8183e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172960.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7606e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193004.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4389e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181248.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1557972., grad_fn=<MseLossBackward>)
output :  tensor([[96371.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(16550.4199, grad_fn=<MseLossBackward>)
output :  tensor([[118379.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(773479., grad_fn=<MseLossBackward>)
output :  tensor([[160025.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7476e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199183.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(666289.5625, grad_fn=<MseLossBackward>)
output :  tensor([[144237.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(56309.8086, grad_fn=<MseLossBackward>)
train_loss: [2.6486966e+09]
epoch_result tensor([0.])
output :  tensor([[157467.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1066185.3750, grad_fn=<MseLossBackward>)
output :  tensor([[123982.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(3928540.7500, grad_fn=<MseLossBackward>)
output :  tensor([[195579.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1900994.6250, grad_fn=<MseLossBackward>)
output :  tensor([[177623.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(389181.0312, grad_fn=<MseLossBackward>)
output :  tensor([[153512.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9962e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133633.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(31732274., grad_fn=<MseLossBackward>)
output :  tensor([[141306.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(94066.8047, grad_fn=<MseLossBackward>)
output :  tensor([[118622.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(142423.6875, grad_fn=<MseLossBackward>)
output :  tensor([[69621.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2368e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165780.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(48262.5977, grad_fn=<MseLossBackward>)
output :  tensor([[137906.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4384443.5000, grad_fn=<MseLossBackward>)
output :  tensor([[225654.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(427736.4375, grad_fn=<MseLossBackward>)
output :  tensor([[169479.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(230250.0312, grad_fn=<MseLossBackward>)
output :  tensor([[250149.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(201727.2969, grad_fn=<MseLossBackward>)
output :  tensor([[56400.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1961750.3750, grad_fn=<MseLossBackward>)
output :  tensor([[163090.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4560e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178276.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(10737193., grad_fn=<MseLossBackward>)
output :  tensor([[156516.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(267.6292, grad_fn=<MseLossBackward>)
output :  tensor([[276020.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1041930.5625, grad_fn=<MseLossBackward>)
output :  tensor([[200611.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(13044964., grad_fn=<MseLossBackward>)
output :  tensor([[137735.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5496e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194903.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1050048.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177943.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2049e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151565.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(319436.9062, grad_fn=<MseLossBackward>)
output :  tensor([[171434.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2057924.7500, grad_fn=<MseLossBackward>)
output :  tensor([[86603.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1449089.2500, grad_fn=<MseLossBackward>)
output :  tensor([[167444.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9642e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185702.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(493418.4375, grad_fn=<MseLossBackward>)
output :  tensor([[203075.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7483e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107203.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(7818446., grad_fn=<MseLossBackward>)
output :  tensor([[171315.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(99688.1953, grad_fn=<MseLossBackward>)
output :  tensor([[136063.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(190518.6094, grad_fn=<MseLossBackward>)
output :  tensor([[126648.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5529405.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121412.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(3657506.7500, grad_fn=<MseLossBackward>)
output :  tensor([[146215.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5355e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168615.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1429e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150785.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1177937.1250, grad_fn=<MseLossBackward>)
output :  tensor([[180933.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(871626.4375, grad_fn=<MseLossBackward>)
output :  tensor([[141158.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(25028.2285, grad_fn=<MseLossBackward>)
output :  tensor([[102558.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5770e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136289.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1953e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139152.]], grad_fn=<AddmmBackward>)
loss:  tensor(17239104., grad_fn=<MseLossBackward>)
output :  tensor([[138067.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2248e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220566.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(19657308., grad_fn=<MseLossBackward>)
output :  tensor([[131738.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(261280.7188, grad_fn=<MseLossBackward>)
output :  tensor([[147143.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3447578.5000, grad_fn=<MseLossBackward>)
output :  tensor([[113848.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3415161.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161470.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2161864.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142021.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8067e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190822.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1386285.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135301.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(725025.6250, grad_fn=<MseLossBackward>)
output :  tensor([[117652.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(58559320., grad_fn=<MseLossBackward>)
output :  tensor([[232337.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2762711.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163232.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5258e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159745.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(555164.6875, grad_fn=<MseLossBackward>)
output :  tensor([[202036.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9058e+10, grad_fn=<MseLossBackward>)
output :  tensor([[241462.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2665e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142958.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(293171.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141308.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(53416456., grad_fn=<MseLossBackward>)
output :  tensor([[152722.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5184942.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132931.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(8593784., grad_fn=<MseLossBackward>)
output :  tensor([[180167.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3732e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183273.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(683748.1250, grad_fn=<MseLossBackward>)
output :  tensor([[160478.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1043143.0625, grad_fn=<MseLossBackward>)
output :  tensor([[132287.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1476e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146517.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(16142817., grad_fn=<MseLossBackward>)
output :  tensor([[149939.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(24401902., grad_fn=<MseLossBackward>)
output :  tensor([[170802.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7449e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195173.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7639e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137468.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(937266., grad_fn=<MseLossBackward>)
output :  tensor([[173678.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3164229.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179846.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1330922.7500, grad_fn=<MseLossBackward>)
output :  tensor([[118488.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(12167016., grad_fn=<MseLossBackward>)
output :  tensor([[220834.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(27385.0781, grad_fn=<MseLossBackward>)
output :  tensor([[188025.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(20479868., grad_fn=<MseLossBackward>)
output :  tensor([[125933.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(188233.9531, grad_fn=<MseLossBackward>)
output :  tensor([[191901.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(21143616., grad_fn=<MseLossBackward>)
output :  tensor([[177321.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5863435., grad_fn=<MseLossBackward>)
output :  tensor([[210730.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0807e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209953.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1096045.3750, grad_fn=<MseLossBackward>)
output :  tensor([[167334.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3202e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193902.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(356539.5938, grad_fn=<MseLossBackward>)
output :  tensor([[111925.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1154869.2500, grad_fn=<MseLossBackward>)
output :  tensor([[115330.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(8010624.5000, grad_fn=<MseLossBackward>)
output :  tensor([[111448.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(304462.5625, grad_fn=<MseLossBackward>)
output :  tensor([[146800.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(0.9690, grad_fn=<MseLossBackward>)
output :  tensor([[160538.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3162e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178710.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1662447.6250, grad_fn=<MseLossBackward>)
output :  tensor([[128894.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(1944085.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145640.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(410220.2500, grad_fn=<MseLossBackward>)
output :  tensor([[184776.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4877e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119878.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(8871043., grad_fn=<MseLossBackward>)
output :  tensor([[200480.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(12113119., grad_fn=<MseLossBackward>)
output :  tensor([[145766.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(587737.8750, grad_fn=<MseLossBackward>)
output :  tensor([[212819.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6492.8340, grad_fn=<MseLossBackward>)
output :  tensor([[128857.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(8167449.5000, grad_fn=<MseLossBackward>)
output :  tensor([[244727.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(12961575., grad_fn=<MseLossBackward>)
output :  tensor([[233964.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6046e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147566.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6136e+08, grad_fn=<MseLossBackward>)
output :  tensor([[84634.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5860e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188411.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4802e+09, grad_fn=<MseLossBackward>)
output :  tensor([[76476.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(20463678., grad_fn=<MseLossBackward>)
output :  tensor([[138249.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1564649.1250, grad_fn=<MseLossBackward>)
output :  tensor([[76997.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(2242623.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145946.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8963475., grad_fn=<MseLossBackward>)
output :  tensor([[175619.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(144863.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151289.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4886172., grad_fn=<MseLossBackward>)
output :  tensor([[109419.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(4079106., grad_fn=<MseLossBackward>)
output :  tensor([[201213.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3119e+10, grad_fn=<MseLossBackward>)
output :  tensor([[128959.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(211535.3125, grad_fn=<MseLossBackward>)
output :  tensor([[265580.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0792e+08, grad_fn=<MseLossBackward>)
output :  tensor([[303754.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(39005100., grad_fn=<MseLossBackward>)
output :  tensor([[109338.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3378473.7500, grad_fn=<MseLossBackward>)
output :  tensor([[171619.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(775252.7500, grad_fn=<MseLossBackward>)
output :  tensor([[134591.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0713e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134840.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(17303000., grad_fn=<MseLossBackward>)
output :  tensor([[130671.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(177293.6250, grad_fn=<MseLossBackward>)
output :  tensor([[124275.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(524787.0625, grad_fn=<MseLossBackward>)
output :  tensor([[136516.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2989e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224630.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9350e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188329.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3308e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143619.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(78461.2656, grad_fn=<MseLossBackward>)
output :  tensor([[130632.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(9813486., grad_fn=<MseLossBackward>)
output :  tensor([[112014.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(585009.8750, grad_fn=<MseLossBackward>)
output :  tensor([[252640.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2799e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136544.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2385818., grad_fn=<MseLossBackward>)
output :  tensor([[203653.]], grad_fn=<AddmmBackward>)
loss:  tensor(426409., grad_fn=<MseLossBackward>)
output :  tensor([[107978.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(9475479., grad_fn=<MseLossBackward>)
output :  tensor([[141088.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1295186.2500, grad_fn=<MseLossBackward>)
output :  tensor([[202126.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0056e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180693.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(630163.0625, grad_fn=<MseLossBackward>)
output :  tensor([[185557.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(310527.5625, grad_fn=<MseLossBackward>)
output :  tensor([[162533.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1452e+10, grad_fn=<MseLossBackward>)
output :  tensor([[292191.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8326e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197493.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(165051.7656, grad_fn=<MseLossBackward>)
output :  tensor([[258661.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0794e+10, grad_fn=<MseLossBackward>)
output :  tensor([[216830.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4177e+09, grad_fn=<MseLossBackward>)
output :  tensor([[280827.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3085e+09, grad_fn=<MseLossBackward>)
output :  tensor([[224904.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(818120.2500, grad_fn=<MseLossBackward>)
output :  tensor([[222756.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8643e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196477.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(273414.5938, grad_fn=<MseLossBackward>)
output :  tensor([[160100.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6725e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133867.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1871124.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138284.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7751265., grad_fn=<MseLossBackward>)
output :  tensor([[93187.]], grad_fn=<AddmmBackward>)
loss:  tensor(4782969., grad_fn=<MseLossBackward>)
output :  tensor([[105378.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6874638., grad_fn=<MseLossBackward>)
output :  tensor([[268732.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6202e+09, grad_fn=<MseLossBackward>)
output :  tensor([[235416.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(173706.6094, grad_fn=<MseLossBackward>)
output :  tensor([[143261.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3022491., grad_fn=<MseLossBackward>)
output :  tensor([[138545.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1093070.2500, grad_fn=<MseLossBackward>)
output :  tensor([[175047.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1728444.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144832.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(173993.2656, grad_fn=<MseLossBackward>)
output :  tensor([[165203.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5831e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164343.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(431279.5312, grad_fn=<MseLossBackward>)
output :  tensor([[137161.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(25926.0312, grad_fn=<MseLossBackward>)
output :  tensor([[186449.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0895e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111283.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(513876.1562, grad_fn=<MseLossBackward>)
output :  tensor([[174102.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4420703.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122741.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(7513295., grad_fn=<MseLossBackward>)
output :  tensor([[86487.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(262872.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179245.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(568775.1875, grad_fn=<MseLossBackward>)
output :  tensor([[110939.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(1081193.7500, grad_fn=<MseLossBackward>)
output :  tensor([[242000.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(9004407., grad_fn=<MseLossBackward>)
output :  tensor([[248505.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(12290831., grad_fn=<MseLossBackward>)
output :  tensor([[120197.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(86537232., grad_fn=<MseLossBackward>)
output :  tensor([[109531.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(327738.3750, grad_fn=<MseLossBackward>)
output :  tensor([[289772.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1721e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177351.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(34240784., grad_fn=<MseLossBackward>)
output :  tensor([[123939.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(1124411.7500, grad_fn=<MseLossBackward>)
output :  tensor([[145568.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6001e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199331.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1518e+08, grad_fn=<MseLossBackward>)
output :  tensor([[143335.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5455655., grad_fn=<MseLossBackward>)
output :  tensor([[156877.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5159e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150020.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(15052824., grad_fn=<MseLossBackward>)
output :  tensor([[128863.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(405759.0625, grad_fn=<MseLossBackward>)
output :  tensor([[246399.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7451e+10, grad_fn=<MseLossBackward>)
output :  tensor([[396583.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(29336780., grad_fn=<MseLossBackward>)
output :  tensor([[113396.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(19326808., grad_fn=<MseLossBackward>)
output :  tensor([[123264.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(22697184., grad_fn=<MseLossBackward>)
output :  tensor([[159492.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(54.3906, grad_fn=<MseLossBackward>)
output :  tensor([[130784.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3894e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163554.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4159e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171121.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7358e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103913.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(98203.8906, grad_fn=<MseLossBackward>)
output :  tensor([[138548.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6011921., grad_fn=<MseLossBackward>)
output :  tensor([[361798.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(30202238., grad_fn=<MseLossBackward>)
output :  tensor([[200703.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8405e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174765.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(539306.6250, grad_fn=<MseLossBackward>)
output :  tensor([[206794.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(15168226., grad_fn=<MseLossBackward>)
output :  tensor([[137507.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2227276.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194285.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(45963.3398, grad_fn=<MseLossBackward>)
output :  tensor([[135284.]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7195e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180437.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(316037.2188, grad_fn=<MseLossBackward>)
output :  tensor([[240536.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2143250.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170915.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(9516165., grad_fn=<MseLossBackward>)
output :  tensor([[110221.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4932910.5000, grad_fn=<MseLossBackward>)
output :  tensor([[267147.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6688366., grad_fn=<MseLossBackward>)
output :  tensor([[249396.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(363835.1562, grad_fn=<MseLossBackward>)
output :  tensor([[121583.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(2005343.6250, grad_fn=<MseLossBackward>)
output :  tensor([[213226.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8160e+09, grad_fn=<MseLossBackward>)
output :  tensor([[304267.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4236e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204605.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5734079., grad_fn=<MseLossBackward>)
output :  tensor([[216203.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5326e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159570.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2790622.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168620.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1874760., grad_fn=<MseLossBackward>)
output :  tensor([[161499.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(20858916., grad_fn=<MseLossBackward>)
output :  tensor([[169561.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(192145.2500, grad_fn=<MseLossBackward>)
output :  tensor([[234740.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1062e+09, grad_fn=<MseLossBackward>)
output :  tensor([[217839.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3495e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161893.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2181e+08, grad_fn=<MseLossBackward>)
output :  tensor([[121756.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1546661.3750, grad_fn=<MseLossBackward>)
output :  tensor([[175687.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1723189.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179456.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4872e+09, grad_fn=<MseLossBackward>)
output :  tensor([[204390.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6186e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134704.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(73992.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151687.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0524e+08, grad_fn=<MseLossBackward>)
output :  tensor([[272831.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(17374048., grad_fn=<MseLossBackward>)
output :  tensor([[88854.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(14857050., grad_fn=<MseLossBackward>)
output :  tensor([[233236.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(10652064., grad_fn=<MseLossBackward>)
output :  tensor([[260528.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0394e+11, grad_fn=<MseLossBackward>)
output :  tensor([[169996.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(11.9241, grad_fn=<MseLossBackward>)
output :  tensor([[193581.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7155e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157712.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7356385., grad_fn=<MseLossBackward>)
output :  tensor([[206298.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0579e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127719.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(1640860.8750, grad_fn=<MseLossBackward>)
output :  tensor([[149002.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(16018630., grad_fn=<MseLossBackward>)
output :  tensor([[171860.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6201e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186489.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(409240.0938, grad_fn=<MseLossBackward>)
output :  tensor([[130985.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(24852172., grad_fn=<MseLossBackward>)
output :  tensor([[138548.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4196096., grad_fn=<MseLossBackward>)
output :  tensor([[176745.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(14026546., grad_fn=<MseLossBackward>)
output :  tensor([[199865.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5134e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239034.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(15722340., grad_fn=<MseLossBackward>)
output :  tensor([[154311.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(474484.1875, grad_fn=<MseLossBackward>)
output :  tensor([[197473.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2172491.7500, grad_fn=<MseLossBackward>)
output :  tensor([[166203.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9300e+08, grad_fn=<MseLossBackward>)
output :  tensor([[192262.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6288e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182808.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8460281., grad_fn=<MseLossBackward>)
output :  tensor([[95531.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(2156102.2500, grad_fn=<MseLossBackward>)
output :  tensor([[172565.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1542e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134986.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(177.2227, grad_fn=<MseLossBackward>)
output :  tensor([[122661.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(58694632., grad_fn=<MseLossBackward>)
output :  tensor([[173809.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(36236.6914, grad_fn=<MseLossBackward>)
output :  tensor([[89241.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(17992974., grad_fn=<MseLossBackward>)
output :  tensor([[289637.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(131134.5156, grad_fn=<MseLossBackward>)
output :  tensor([[170402.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(29187006., grad_fn=<MseLossBackward>)
output :  tensor([[191196.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0156e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243113.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7768e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147579.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(11698217., grad_fn=<MseLossBackward>)
output :  tensor([[125871.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3503272.5000, grad_fn=<MseLossBackward>)
output :  tensor([[119631.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(72348.3906, grad_fn=<MseLossBackward>)
output :  tensor([[147213.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0377e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175403.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1968496.7500, grad_fn=<MseLossBackward>)
output :  tensor([[111370.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3350e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208276.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2039e+10, grad_fn=<MseLossBackward>)
output :  tensor([[245922.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(19562652., grad_fn=<MseLossBackward>)
output :  tensor([[249434.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1245e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221253.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1493e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195956.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4291e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188802.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1696994.7500, grad_fn=<MseLossBackward>)
output :  tensor([[204083.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8747e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189562.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1444e+10, grad_fn=<MseLossBackward>)
output :  tensor([[183703.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(24631834., grad_fn=<MseLossBackward>)
output :  tensor([[152338.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(114783.3203, grad_fn=<MseLossBackward>)
output :  tensor([[330436.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(43077480., grad_fn=<MseLossBackward>)
output :  tensor([[212089.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(7996.2715, grad_fn=<MseLossBackward>)
output :  tensor([[157152.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(8107277.5000, grad_fn=<MseLossBackward>)
output :  tensor([[184864.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2076e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108233.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(10454865., grad_fn=<MseLossBackward>)
output :  tensor([[272895.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9583e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170394.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(12287216., grad_fn=<MseLossBackward>)
output :  tensor([[217135.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(13216406., grad_fn=<MseLossBackward>)
output :  tensor([[208344.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6017e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180495.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1677308.2500, grad_fn=<MseLossBackward>)
output :  tensor([[200128.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2793807.7500, grad_fn=<MseLossBackward>)
output :  tensor([[157117.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4482681.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150334.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5336e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120625.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(4519112., grad_fn=<MseLossBackward>)
output :  tensor([[140356.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(127103.3906, grad_fn=<MseLossBackward>)
output :  tensor([[149873.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(763657.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202282.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5805e+10, grad_fn=<MseLossBackward>)
output :  tensor([[162018.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6343078.5000, grad_fn=<MseLossBackward>)
output :  tensor([[98024.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2177423., grad_fn=<MseLossBackward>)
output :  tensor([[221580.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3928e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186156.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2667e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176467.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(315.0625, grad_fn=<MseLossBackward>)
output :  tensor([[85874.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(15012719., grad_fn=<MseLossBackward>)
output :  tensor([[128220.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(78365., grad_fn=<MseLossBackward>)
output :  tensor([[215465.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2146454., grad_fn=<MseLossBackward>)
output :  tensor([[143489.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(260259.4062, grad_fn=<MseLossBackward>)
output :  tensor([[133915.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(15328571., grad_fn=<MseLossBackward>)
output :  tensor([[146517.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(15345582., grad_fn=<MseLossBackward>)
output :  tensor([[179065.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7277e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145031.]], grad_fn=<AddmmBackward>)
loss:  tensor(1062961., grad_fn=<MseLossBackward>)
output :  tensor([[159237.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(580667.8125, grad_fn=<MseLossBackward>)
output :  tensor([[214748.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(63370.1953, grad_fn=<MseLossBackward>)
output :  tensor([[138533.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1245e+09, grad_fn=<MseLossBackward>)
output :  tensor([[257736.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7487320.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158650.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(722234.3750, grad_fn=<MseLossBackward>)
output :  tensor([[129114.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(378119.3125, grad_fn=<MseLossBackward>)
output :  tensor([[95388.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(150986.8906, grad_fn=<MseLossBackward>)
output :  tensor([[152701.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6514e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176853.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(9281257., grad_fn=<MseLossBackward>)
output :  tensor([[122687.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4786250., grad_fn=<MseLossBackward>)
output :  tensor([[187538.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7149e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145739.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3877e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150205.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(93406.6406, grad_fn=<MseLossBackward>)
output :  tensor([[189502.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3069668.2500, grad_fn=<MseLossBackward>)
output :  tensor([[250850.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7831e+09, grad_fn=<MseLossBackward>)
output :  tensor([[90288.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1467013., grad_fn=<MseLossBackward>)
output :  tensor([[235039.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(24605166., grad_fn=<MseLossBackward>)
output :  tensor([[130735.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(4995399.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166254.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9292e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113480.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8173e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174486.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2291391.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164850.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4771e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155047.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0257e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238360.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(408620.5938, grad_fn=<MseLossBackward>)
output :  tensor([[226037.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0216e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127064.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4098., grad_fn=<MseLossBackward>)
output :  tensor([[129119.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(9731329., grad_fn=<MseLossBackward>)
output :  tensor([[223381.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(13090263., grad_fn=<MseLossBackward>)
output :  tensor([[226964.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(49494964., grad_fn=<MseLossBackward>)
output :  tensor([[228791.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4374437.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145749.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5065946., grad_fn=<MseLossBackward>)
output :  tensor([[211310.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1716386.6250, grad_fn=<MseLossBackward>)
output :  tensor([[132699.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6129e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133062.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(316494.1562, grad_fn=<MseLossBackward>)
output :  tensor([[307031.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(63504464., grad_fn=<MseLossBackward>)
output :  tensor([[137162.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(14723408., grad_fn=<MseLossBackward>)
output :  tensor([[119941.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8028e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107895.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(2574295., grad_fn=<MseLossBackward>)
output :  tensor([[155144.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0122e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178231.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3110e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174134.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1287693., grad_fn=<MseLossBackward>)
output :  tensor([[192063.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(79861312., grad_fn=<MseLossBackward>)
output :  tensor([[100894.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(800284., grad_fn=<MseLossBackward>)
output :  tensor([[181482.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6162651., grad_fn=<MseLossBackward>)
output :  tensor([[166011.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3567022.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140577.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2488752.7500, grad_fn=<MseLossBackward>)
output :  tensor([[257840.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0254e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141573.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2005e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172865.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(18220.7812, grad_fn=<MseLossBackward>)
output :  tensor([[137007.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(8957955., grad_fn=<MseLossBackward>)
output :  tensor([[201897.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1953181., grad_fn=<MseLossBackward>)
output :  tensor([[169151.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(720668.3750, grad_fn=<MseLossBackward>)
output :  tensor([[240732.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(10677475., grad_fn=<MseLossBackward>)
output :  tensor([[133329.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1369558.2500, grad_fn=<MseLossBackward>)
output :  tensor([[152139.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7783751.5000, grad_fn=<MseLossBackward>)
output :  tensor([[213223.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3155563.7500, grad_fn=<MseLossBackward>)
output :  tensor([[165546.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(299140.6250, grad_fn=<MseLossBackward>)
output :  tensor([[206556.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0822e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134754.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8783e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128264.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(540684.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137499.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6253750.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198567.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0315e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166445.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6467e+09, grad_fn=<MseLossBackward>)
output :  tensor([[75761.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4842e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93723.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(85077272., grad_fn=<MseLossBackward>)
output :  tensor([[249949.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(11182232., grad_fn=<MseLossBackward>)
output :  tensor([[203585.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1712e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113284.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2941332.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158626.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3366e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206517.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8177e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180399.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0283e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157843.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(8086292., grad_fn=<MseLossBackward>)
output :  tensor([[170677.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(458455.9375, grad_fn=<MseLossBackward>)
output :  tensor([[114653.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(120289.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164697.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(94042416., grad_fn=<MseLossBackward>)
output :  tensor([[194960.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4255e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224606.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(26072832., grad_fn=<MseLossBackward>)
output :  tensor([[242358.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5265e+11, grad_fn=<MseLossBackward>)
output :  tensor([[147663.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(439693.3125, grad_fn=<MseLossBackward>)
output :  tensor([[109026.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(298354.9375, grad_fn=<MseLossBackward>)
output :  tensor([[170157.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3788e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153352.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(8134795.5000, grad_fn=<MseLossBackward>)
output :  tensor([[233828.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(10055736., grad_fn=<MseLossBackward>)
output :  tensor([[117738.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7496986.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182046.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(728488.9375, grad_fn=<MseLossBackward>)
output :  tensor([[185467.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1518555.6250, grad_fn=<MseLossBackward>)
output :  tensor([[165176.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3970e+10, grad_fn=<MseLossBackward>)
output :  tensor([[95878.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2138e+08, grad_fn=<MseLossBackward>)
output :  tensor([[240968.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3873147., grad_fn=<MseLossBackward>)
output :  tensor([[179085.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(9522914., grad_fn=<MseLossBackward>)
output :  tensor([[141428.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2041058.6250, grad_fn=<MseLossBackward>)
output :  tensor([[231020.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(15832814., grad_fn=<MseLossBackward>)
output :  tensor([[163795.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(632671.1250, grad_fn=<MseLossBackward>)
output :  tensor([[202095.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5106e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135674.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(454971.3438, grad_fn=<MseLossBackward>)
output :  tensor([[187432.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4682e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137529.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2339226.7500, grad_fn=<MseLossBackward>)
output :  tensor([[224250.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3805e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225578.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9643e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93224.]], grad_fn=<AddmmBackward>)
loss:  tensor(10394176., grad_fn=<MseLossBackward>)
output :  tensor([[159062.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(138279.3906, grad_fn=<MseLossBackward>)
output :  tensor([[243605.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6198e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144685.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(98890.5938, grad_fn=<MseLossBackward>)
output :  tensor([[108774.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7451e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161820.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7181227.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142109.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3573163.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128499.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(89639.4219, grad_fn=<MseLossBackward>)
output :  tensor([[190668.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6692e+09, grad_fn=<MseLossBackward>)
output :  tensor([[122375.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(15525.5498, grad_fn=<MseLossBackward>)
output :  tensor([[150898.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1213784.2500, grad_fn=<MseLossBackward>)
output :  tensor([[169024.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7428520.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150380.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(383528.6250, grad_fn=<MseLossBackward>)
output :  tensor([[161171.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2989333., grad_fn=<MseLossBackward>)
output :  tensor([[136298.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4519e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134830.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(8009165.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154753.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4816e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144404.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(63914.1602, grad_fn=<MseLossBackward>)
output :  tensor([[165167.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(11680374., grad_fn=<MseLossBackward>)
output :  tensor([[139846.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9679e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150288.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2216748.7500, grad_fn=<MseLossBackward>)
output :  tensor([[184753.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(10538139., grad_fn=<MseLossBackward>)
output :  tensor([[168194.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(648905.7500, grad_fn=<MseLossBackward>)
output :  tensor([[181829.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3347642., grad_fn=<MseLossBackward>)
output :  tensor([[222077.]], grad_fn=<AddmmBackward>)
loss:  tensor(4313929., grad_fn=<MseLossBackward>)
output :  tensor([[112186.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(18369996., grad_fn=<MseLossBackward>)
output :  tensor([[139091.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0139e+08, grad_fn=<MseLossBackward>)
output :  tensor([[285913.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(7439.0625, grad_fn=<MseLossBackward>)
output :  tensor([[119973.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(15786033., grad_fn=<MseLossBackward>)
output :  tensor([[174474.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0726e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190470.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(29923636., grad_fn=<MseLossBackward>)
output :  tensor([[186470.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(941627.6250, grad_fn=<MseLossBackward>)
output :  tensor([[252563.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0338e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222907.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(822989.1875, grad_fn=<MseLossBackward>)
output :  tensor([[133963.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8757e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176457.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5026e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128225.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(17853794., grad_fn=<MseLossBackward>)
output :  tensor([[184176.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4823e+10, grad_fn=<MseLossBackward>)
output :  tensor([[154037.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1077281.8750, grad_fn=<MseLossBackward>)
output :  tensor([[155795.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(86408064., grad_fn=<MseLossBackward>)
output :  tensor([[205988.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(96934.9297, grad_fn=<MseLossBackward>)
output :  tensor([[144743.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4990e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176210.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(44283.9414, grad_fn=<MseLossBackward>)
output :  tensor([[247979.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9353e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147555.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(197885.9688, grad_fn=<MseLossBackward>)
output :  tensor([[200486.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4745522., grad_fn=<MseLossBackward>)
output :  tensor([[166215.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(39252380., grad_fn=<MseLossBackward>)
output :  tensor([[125868.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4340e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135416.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(111347.3438, grad_fn=<MseLossBackward>)
output :  tensor([[181463.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6435576., grad_fn=<MseLossBackward>)
output :  tensor([[194637.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(21504232., grad_fn=<MseLossBackward>)
output :  tensor([[221613.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5409e+09, grad_fn=<MseLossBackward>)
output :  tensor([[257900.]], grad_fn=<AddmmBackward>)
loss:  tensor(810000., grad_fn=<MseLossBackward>)
output :  tensor([[181703.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8850e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142717.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6232e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149622.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(26235204., grad_fn=<MseLossBackward>)
output :  tensor([[72557.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0600e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141679.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(44616764., grad_fn=<MseLossBackward>)
output :  tensor([[128512.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(149811.3281, grad_fn=<MseLossBackward>)
output :  tensor([[154111.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(12509.0244, grad_fn=<MseLossBackward>)
output :  tensor([[128680.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(2822531.2500, grad_fn=<MseLossBackward>)
output :  tensor([[76542.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1782.4229, grad_fn=<MseLossBackward>)
output :  tensor([[84018.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4073774.5000, grad_fn=<MseLossBackward>)
output :  tensor([[237078.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(25786878., grad_fn=<MseLossBackward>)
output :  tensor([[141088.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1730e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135311.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(23152186., grad_fn=<MseLossBackward>)
output :  tensor([[167543.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(294950.8125, grad_fn=<MseLossBackward>)
output :  tensor([[231469.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(12467189., grad_fn=<MseLossBackward>)
output :  tensor([[187213.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(24269016., grad_fn=<MseLossBackward>)
output :  tensor([[153624.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5643891., grad_fn=<MseLossBackward>)
output :  tensor([[196599.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1692316.3750, grad_fn=<MseLossBackward>)
output :  tensor([[197499.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5603e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136282.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(514828.6875, grad_fn=<MseLossBackward>)
output :  tensor([[155917.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(841032.3125, grad_fn=<MseLossBackward>)
output :  tensor([[134881.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1250762.6250, grad_fn=<MseLossBackward>)
output :  tensor([[197626.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0481e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153460.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(291245.7188, grad_fn=<MseLossBackward>)
output :  tensor([[137431.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9300e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144305.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(353467.4062, grad_fn=<MseLossBackward>)
output :  tensor([[208134.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(14944990., grad_fn=<MseLossBackward>)
output :  tensor([[104356.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9983e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166673.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(683567.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128280.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(78697.7812, grad_fn=<MseLossBackward>)
output :  tensor([[143971.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(9170866., grad_fn=<MseLossBackward>)
output :  tensor([[107513.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0367e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138791.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1666761.7500, grad_fn=<MseLossBackward>)
output :  tensor([[234044.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3822086., grad_fn=<MseLossBackward>)
output :  tensor([[144995.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(16.1252, grad_fn=<MseLossBackward>)
output :  tensor([[139163.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2768792., grad_fn=<MseLossBackward>)
output :  tensor([[164389.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3242e+09, grad_fn=<MseLossBackward>)
output :  tensor([[265563.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5466e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171285.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(13798903., grad_fn=<MseLossBackward>)
output :  tensor([[104231.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2118025.5000, grad_fn=<MseLossBackward>)
output :  tensor([[199631.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0635e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157471.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2336169., grad_fn=<MseLossBackward>)
output :  tensor([[162999.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5979e+10, grad_fn=<MseLossBackward>)
output :  tensor([[99937.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2681099.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123410.]], grad_fn=<AddmmBackward>)
loss:  tensor(36100., grad_fn=<MseLossBackward>)
output :  tensor([[154140.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3459542., grad_fn=<MseLossBackward>)
output :  tensor([[142149.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4619678.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200233.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(54339.9805, grad_fn=<MseLossBackward>)
output :  tensor([[141154.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(714949.5000, grad_fn=<MseLossBackward>)
output :  tensor([[257419.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(23624156., grad_fn=<MseLossBackward>)
output :  tensor([[126386.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1146e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166230.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(533310.6875, grad_fn=<MseLossBackward>)
output :  tensor([[188178.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(103412.4922, grad_fn=<MseLossBackward>)
output :  tensor([[123027.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6971e+08, grad_fn=<MseLossBackward>)
output :  tensor([[249817.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(33232.1523, grad_fn=<MseLossBackward>)
output :  tensor([[158915.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8873e+08, grad_fn=<MseLossBackward>)
output :  tensor([[245851.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(251251.5625, grad_fn=<MseLossBackward>)
output :  tensor([[144083.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6894.1885, grad_fn=<MseLossBackward>)
output :  tensor([[214707.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(22156732., grad_fn=<MseLossBackward>)
output :  tensor([[174736.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5458575., grad_fn=<MseLossBackward>)
output :  tensor([[153916.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(7035.0156, grad_fn=<MseLossBackward>)
output :  tensor([[118149.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(22294.2227, grad_fn=<MseLossBackward>)
output :  tensor([[238421.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3686e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238431.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2459653., grad_fn=<MseLossBackward>)
output :  tensor([[152131.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1452100.3750, grad_fn=<MseLossBackward>)
output :  tensor([[254041.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(736673.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123936.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(88974560., grad_fn=<MseLossBackward>)
output :  tensor([[180049.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(16399336., grad_fn=<MseLossBackward>)
output :  tensor([[164312.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(18595366., grad_fn=<MseLossBackward>)
output :  tensor([[129966.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(1068138.3750, grad_fn=<MseLossBackward>)
output :  tensor([[195743.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3882e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163319.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(463526.9375, grad_fn=<MseLossBackward>)
output :  tensor([[167984.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(24844928., grad_fn=<MseLossBackward>)
output :  tensor([[159280.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1640640.7500, grad_fn=<MseLossBackward>)
output :  tensor([[145825.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(16604734., grad_fn=<MseLossBackward>)
output :  tensor([[177200.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5834e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163941.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(15536531., grad_fn=<MseLossBackward>)
output :  tensor([[377617.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(40348700., grad_fn=<MseLossBackward>)
output :  tensor([[119656.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(53933072., grad_fn=<MseLossBackward>)
output :  tensor([[129662.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9503e+09, grad_fn=<MseLossBackward>)
output :  tensor([[282664.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2106126.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162860.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(740944.3750, grad_fn=<MseLossBackward>)
output :  tensor([[131064.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1160e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227757.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(17998938., grad_fn=<MseLossBackward>)
output :  tensor([[183632.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9814123., grad_fn=<MseLossBackward>)
output :  tensor([[153925.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3705865.7500, grad_fn=<MseLossBackward>)
output :  tensor([[144682.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(100974.9922, grad_fn=<MseLossBackward>)
output :  tensor([[154002.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9250e+08, grad_fn=<MseLossBackward>)
output :  tensor([[100824.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(679684.3125, grad_fn=<MseLossBackward>)
output :  tensor([[79651.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8617e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164125.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(763903.3125, grad_fn=<MseLossBackward>)
output :  tensor([[185772.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7832e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160167.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4699208., grad_fn=<MseLossBackward>)
output :  tensor([[162287.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(22915818., grad_fn=<MseLossBackward>)
output :  tensor([[136202.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1556919., grad_fn=<MseLossBackward>)
output :  tensor([[208914.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(8789835., grad_fn=<MseLossBackward>)
output :  tensor([[138207.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(42881.3516, grad_fn=<MseLossBackward>)
output :  tensor([[180031.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6892e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142576.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(11719175., grad_fn=<MseLossBackward>)
output :  tensor([[111357.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0415e+08, grad_fn=<MseLossBackward>)
output :  tensor([[95990.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3962152.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175408.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(166999.9375, grad_fn=<MseLossBackward>)
output :  tensor([[265613.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(27183514., grad_fn=<MseLossBackward>)
output :  tensor([[142218.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(516376.9688, grad_fn=<MseLossBackward>)
output :  tensor([[161126.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1515784.1250, grad_fn=<MseLossBackward>)
output :  tensor([[132409.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(8147.8828, grad_fn=<MseLossBackward>)
output :  tensor([[153385.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(15096503., grad_fn=<MseLossBackward>)
output :  tensor([[169512.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2601466.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126160.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(705180.0625, grad_fn=<MseLossBackward>)
output :  tensor([[174045.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4365e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157008.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(72.2500, grad_fn=<MseLossBackward>)
output :  tensor([[118928.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5895336., grad_fn=<MseLossBackward>)
output :  tensor([[159479.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4052e+09, grad_fn=<MseLossBackward>)
output :  tensor([[54890.2227]], grad_fn=<AddmmBackward>)
loss:  tensor(8353387., grad_fn=<MseLossBackward>)
output :  tensor([[229654.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8634e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200914.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(7299.5664, grad_fn=<MseLossBackward>)
output :  tensor([[181525.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(12073996., grad_fn=<MseLossBackward>)
output :  tensor([[108027.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(4112689., grad_fn=<MseLossBackward>)
output :  tensor([[85158.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3391007.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140698.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(488098.7188, grad_fn=<MseLossBackward>)
output :  tensor([[217805.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8057e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199616.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(62156472., grad_fn=<MseLossBackward>)
output :  tensor([[169882.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(23842926., grad_fn=<MseLossBackward>)
output :  tensor([[169986.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0275e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189593.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(164848.6875, grad_fn=<MseLossBackward>)
output :  tensor([[88203.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(1449446.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138931.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1142694.2500, grad_fn=<MseLossBackward>)
output :  tensor([[108851.]], grad_fn=<AddmmBackward>)
loss:  tensor(2719201., grad_fn=<MseLossBackward>)
output :  tensor([[150340.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0679e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171035.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6029e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196470.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(72747576., grad_fn=<MseLossBackward>)
output :  tensor([[177590.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5804561., grad_fn=<MseLossBackward>)
output :  tensor([[99110.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6813568., grad_fn=<MseLossBackward>)
output :  tensor([[117480.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(386.6754, grad_fn=<MseLossBackward>)
output :  tensor([[158218.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6468e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196873.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(9774025., grad_fn=<MseLossBackward>)
output :  tensor([[141423.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6639318.5000, grad_fn=<MseLossBackward>)
train_loss: [2.6443988e+09]
epoch_result tensor([0.])
output :  tensor([[158799.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(89840.6953, grad_fn=<MseLossBackward>)
output :  tensor([[120818.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1396717.7500, grad_fn=<MseLossBackward>)
output :  tensor([[194836.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(403363.9062, grad_fn=<MseLossBackward>)
output :  tensor([[178083.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1173058.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153661.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9234e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128912.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(831829.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142104.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1220472.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120581.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(2500079.7500, grad_fn=<MseLossBackward>)
output :  tensor([[69534.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2176e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165793.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(42616.4414, grad_fn=<MseLossBackward>)
output :  tensor([[148978.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(80619912., grad_fn=<MseLossBackward>)
output :  tensor([[224530.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(220782.5156, grad_fn=<MseLossBackward>)
output :  tensor([[169921.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(849191.0625, grad_fn=<MseLossBackward>)
output :  tensor([[246738.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(8767984., grad_fn=<MseLossBackward>)
output :  tensor([[55925.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(856622.5625, grad_fn=<MseLossBackward>)
output :  tensor([[163087.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4548e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174070.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(864464.1250, grad_fn=<MseLossBackward>)
output :  tensor([[153614.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(8324307., grad_fn=<MseLossBackward>)
output :  tensor([[274216.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(614117.1250, grad_fn=<MseLossBackward>)
output :  tensor([[196025.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(949315.3125, grad_fn=<MseLossBackward>)
output :  tensor([[137195.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5792e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193283.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(354787.7500, grad_fn=<MseLossBackward>)
output :  tensor([[176718.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3215e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152104.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1219782.2500, grad_fn=<MseLossBackward>)
output :  tensor([[166210.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(14357350., grad_fn=<MseLossBackward>)
output :  tensor([[85811.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(169043.0312, grad_fn=<MseLossBackward>)
output :  tensor([[167617.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9830e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186689.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2855572., grad_fn=<MseLossBackward>)
output :  tensor([[202847.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7723e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109572.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(182903.2344, grad_fn=<MseLossBackward>)
output :  tensor([[169433.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2454558.7500, grad_fn=<MseLossBackward>)
output :  tensor([[137351.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(725611.1250, grad_fn=<MseLossBackward>)
output :  tensor([[131498.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6243049., grad_fn=<MseLossBackward>)
output :  tensor([[121949.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(6000701., grad_fn=<MseLossBackward>)
output :  tensor([[147538.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3258e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169960.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1037e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147075.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6886606., grad_fn=<MseLossBackward>)
output :  tensor([[180804.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(646918.6250, grad_fn=<MseLossBackward>)
output :  tensor([[144262.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(10641460., grad_fn=<MseLossBackward>)
output :  tensor([[110334.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1351e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136028.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2365e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137086.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4355438.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137475.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0973e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224063.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(876768.8750, grad_fn=<MseLossBackward>)
output :  tensor([[131157.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1193624.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155894.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(47535208., grad_fn=<MseLossBackward>)
output :  tensor([[109289.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(7344142.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161494.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2234464.5000, grad_fn=<MseLossBackward>)
output :  tensor([[149372.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0819e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194388.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(5705454.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134025.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(180598.4375, grad_fn=<MseLossBackward>)
output :  tensor([[111861.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3464949.5000, grad_fn=<MseLossBackward>)
output :  tensor([[230687.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(10974830., grad_fn=<MseLossBackward>)
output :  tensor([[164453.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4046e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155121.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(15044580., grad_fn=<MseLossBackward>)
output :  tensor([[202772.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8807e+10, grad_fn=<MseLossBackward>)
output :  tensor([[249885.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0840e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143875.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(140941.5781, grad_fn=<MseLossBackward>)
output :  tensor([[136528.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6395129.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160892.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(34717320., grad_fn=<MseLossBackward>)
output :  tensor([[131415.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2003109.5000, grad_fn=<MseLossBackward>)
output :  tensor([[181259.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2000e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181228.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(8245691.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165269.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(14209484., grad_fn=<MseLossBackward>)
output :  tensor([[143240.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(57915.4297, grad_fn=<MseLossBackward>)
output :  tensor([[144891.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5717329.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145004.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(18.5977, grad_fn=<MseLossBackward>)
output :  tensor([[171973.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5850e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194681.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9810e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136467.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1060.3164, grad_fn=<MseLossBackward>)
output :  tensor([[174207.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5325277.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179653.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1811926.3750, grad_fn=<MseLossBackward>)
output :  tensor([[115194.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(37897.1406, grad_fn=<MseLossBackward>)
output :  tensor([[218303.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(7271618., grad_fn=<MseLossBackward>)
output :  tensor([[183836.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(113432.1328, grad_fn=<MseLossBackward>)
output :  tensor([[123729.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(3134200., grad_fn=<MseLossBackward>)
output :  tensor([[198160.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2758661.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175651.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(565410., grad_fn=<MseLossBackward>)
output :  tensor([[207556.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1931e+10, grad_fn=<MseLossBackward>)
output :  tensor([[211423.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(179365.4844, grad_fn=<MseLossBackward>)
output :  tensor([[169304.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4672e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195301.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(643078.6875, grad_fn=<MseLossBackward>)
output :  tensor([[113350.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(122800.9688, grad_fn=<MseLossBackward>)
output :  tensor([[113675.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1381175.8750, grad_fn=<MseLossBackward>)
output :  tensor([[113452.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2109347.7500, grad_fn=<MseLossBackward>)
output :  tensor([[146957.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(24717.7344, grad_fn=<MseLossBackward>)
output :  tensor([[160933.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3018e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179302.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(487073.1250, grad_fn=<MseLossBackward>)
output :  tensor([[130206.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(7327299., grad_fn=<MseLossBackward>)
output :  tensor([[144602.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(157633.8125, grad_fn=<MseLossBackward>)
output :  tensor([[184972.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5073e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117289.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(151740.6875, grad_fn=<MseLossBackward>)
output :  tensor([[190169.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(46659572., grad_fn=<MseLossBackward>)
output :  tensor([[147333.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5446826.5000, grad_fn=<MseLossBackward>)
output :  tensor([[217769.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(23711422., grad_fn=<MseLossBackward>)
output :  tensor([[128594.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6732889.5000, grad_fn=<MseLossBackward>)
output :  tensor([[245717.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6812834., grad_fn=<MseLossBackward>)
output :  tensor([[236176.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3837e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149840.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4004e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85249.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8804e+08, grad_fn=<MseLossBackward>)
output :  tensor([[191155.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0131e+09, grad_fn=<MseLossBackward>)
output :  tensor([[81449.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(201895.7656, grad_fn=<MseLossBackward>)
output :  tensor([[138277.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1495652.6250, grad_fn=<MseLossBackward>)
output :  tensor([[76941.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(2078710.6250, grad_fn=<MseLossBackward>)
output :  tensor([[145516.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6570971.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177261.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1591934.2500, grad_fn=<MseLossBackward>)
output :  tensor([[154473.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(946759.4375, grad_fn=<MseLossBackward>)
output :  tensor([[109693.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5261002.5000, grad_fn=<MseLossBackward>)
output :  tensor([[201615.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3027e+10, grad_fn=<MseLossBackward>)
output :  tensor([[128280.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(48331.2734, grad_fn=<MseLossBackward>)
output :  tensor([[267685.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5164e+08, grad_fn=<MseLossBackward>)
output :  tensor([[303221.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(45951876., grad_fn=<MseLossBackward>)
output :  tensor([[106497.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(1004614.6875, grad_fn=<MseLossBackward>)
output :  tensor([[171741.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(574824.5625, grad_fn=<MseLossBackward>)
output :  tensor([[134120.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8229e+08, grad_fn=<MseLossBackward>)
output :  tensor([[143635.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(21483370., grad_fn=<MseLossBackward>)
output :  tensor([[126655.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(12917117., grad_fn=<MseLossBackward>)
output :  tensor([[127727.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7441899., grad_fn=<MseLossBackward>)
output :  tensor([[138276.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2811e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227473.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8230e+10, grad_fn=<MseLossBackward>)
output :  tensor([[185456.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4194e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144334.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(188450.9531, grad_fn=<MseLossBackward>)
output :  tensor([[129961.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(6060597.5000, grad_fn=<MseLossBackward>)
output :  tensor([[108656.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6728106.5000, grad_fn=<MseLossBackward>)
output :  tensor([[254175.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0814e+09, grad_fn=<MseLossBackward>)
output :  tensor([[132901.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4403046.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200213.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7763624.5000, grad_fn=<MseLossBackward>)
output :  tensor([[102295.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6781385.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140200.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(62993.1562, grad_fn=<MseLossBackward>)
output :  tensor([[204975.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8120e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178379.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2313108.2500, grad_fn=<MseLossBackward>)
output :  tensor([[186369.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1876728.7500, grad_fn=<MseLossBackward>)
output :  tensor([[162807.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1372e+10, grad_fn=<MseLossBackward>)
output :  tensor([[297240.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4257e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196998.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(812871.3125, grad_fn=<MseLossBackward>)
output :  tensor([[258846.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0740e+10, grad_fn=<MseLossBackward>)
output :  tensor([[218147.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2899e+09, grad_fn=<MseLossBackward>)
output :  tensor([[276963.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6030e+09, grad_fn=<MseLossBackward>)
output :  tensor([[221556.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5972830.5000, grad_fn=<MseLossBackward>)
output :  tensor([[222491.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8733e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194723.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5181883., grad_fn=<MseLossBackward>)
output :  tensor([[161152.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0338e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127717.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(22870214., grad_fn=<MseLossBackward>)
output :  tensor([[136535.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1073004.6250, grad_fn=<MseLossBackward>)
output :  tensor([[90844.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(24262.9297, grad_fn=<MseLossBackward>)
output :  tensor([[107991.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(69.7486, grad_fn=<MseLossBackward>)
output :  tensor([[272784.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1489e+09, grad_fn=<MseLossBackward>)
output :  tensor([[231834.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(10019797., grad_fn=<MseLossBackward>)
output :  tensor([[147560.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(6558481., grad_fn=<MseLossBackward>)
output :  tensor([[137634.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(18052.4414, grad_fn=<MseLossBackward>)
output :  tensor([[175420.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2847023.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144467.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(612526.3750, grad_fn=<MseLossBackward>)
output :  tensor([[165083.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6535e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168234.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(10463405., grad_fn=<MseLossBackward>)
output :  tensor([[138282.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1645607.8750, grad_fn=<MseLossBackward>)
output :  tensor([[189837.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5343e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113296.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1681520., grad_fn=<MseLossBackward>)
output :  tensor([[163242.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(76693256., grad_fn=<MseLossBackward>)
output :  tensor([[119334.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(442287.3438, grad_fn=<MseLossBackward>)
output :  tensor([[88063.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(1131746.8750, grad_fn=<MseLossBackward>)
output :  tensor([[179530.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(220826.5625, grad_fn=<MseLossBackward>)
output :  tensor([[108557.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1801006., grad_fn=<MseLossBackward>)
output :  tensor([[233714.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(27932546., grad_fn=<MseLossBackward>)
output :  tensor([[245994.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(988999.1875, grad_fn=<MseLossBackward>)
output :  tensor([[127713.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3192587.2500, grad_fn=<MseLossBackward>)
output :  tensor([[109641.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(465337.1562, grad_fn=<MseLossBackward>)
output :  tensor([[289326.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1853e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170778.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(521261.4375, grad_fn=<MseLossBackward>)
output :  tensor([[127296.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5272836., grad_fn=<MseLossBackward>)
output :  tensor([[146148.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9233e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198517.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3970e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141291.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(84917.6016, grad_fn=<MseLossBackward>)
output :  tensor([[156320.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5297e+10, grad_fn=<MseLossBackward>)
output :  tensor([[155636.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3015866.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131475.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3904082., grad_fn=<MseLossBackward>)
output :  tensor([[242772.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8422e+10, grad_fn=<MseLossBackward>)
output :  tensor([[400612.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1925850., grad_fn=<MseLossBackward>)
output :  tensor([[103517.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(30054552., grad_fn=<MseLossBackward>)
output :  tensor([[114303.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(17609694., grad_fn=<MseLossBackward>)
output :  tensor([[161338.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3381806., grad_fn=<MseLossBackward>)
output :  tensor([[131548.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0406e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162885.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4945e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173977.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0931e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103965.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(133675.9219, grad_fn=<MseLossBackward>)
output :  tensor([[137610.]], grad_fn=<AddmmBackward>)
loss:  tensor(11492100., grad_fn=<MseLossBackward>)
output :  tensor([[363077.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(17781244., grad_fn=<MseLossBackward>)
output :  tensor([[201470.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7593e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176043.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(294950.8125, grad_fn=<MseLossBackward>)
output :  tensor([[197989.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(24113010., grad_fn=<MseLossBackward>)
output :  tensor([[141943.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8662445., grad_fn=<MseLossBackward>)
output :  tensor([[194233.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(70963.9688, grad_fn=<MseLossBackward>)
output :  tensor([[136113.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1871e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179239.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3098370., grad_fn=<MseLossBackward>)
output :  tensor([[240708.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1669102.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175994.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3979339.2500, grad_fn=<MseLossBackward>)
output :  tensor([[107404.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(354071.5000, grad_fn=<MseLossBackward>)
output :  tensor([[266885.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5404462.5000, grad_fn=<MseLossBackward>)
output :  tensor([[250808.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(653773.3125, grad_fn=<MseLossBackward>)
output :  tensor([[123218.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(47578.5156, grad_fn=<MseLossBackward>)
output :  tensor([[215253.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5697e+09, grad_fn=<MseLossBackward>)
output :  tensor([[304106.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4915e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206777.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(49471.4922, grad_fn=<MseLossBackward>)
output :  tensor([[213491.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6005e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160350.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6006788.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174649.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(21706718., grad_fn=<MseLossBackward>)
output :  tensor([[160165.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(10457442., grad_fn=<MseLossBackward>)
output :  tensor([[173227.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(10415243., grad_fn=<MseLossBackward>)
output :  tensor([[233306.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2037e+09, grad_fn=<MseLossBackward>)
output :  tensor([[212862.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7533e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161783.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1855e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122484.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(265377.9062, grad_fn=<MseLossBackward>)
output :  tensor([[177643.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(414655.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178739.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6033e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205154.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5896e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133627.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(647295.6875, grad_fn=<MseLossBackward>)
output :  tensor([[152051.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2729e+08, grad_fn=<MseLossBackward>)
output :  tensor([[275205.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3219669.5000, grad_fn=<MseLossBackward>)
output :  tensor([[86557.]], grad_fn=<AddmmBackward>)
loss:  tensor(2424249., grad_fn=<MseLossBackward>)
output :  tensor([[235432.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1140290.2500, grad_fn=<MseLossBackward>)
output :  tensor([[258573.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0521e+11, grad_fn=<MseLossBackward>)
output :  tensor([[173901.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(15218045., grad_fn=<MseLossBackward>)
output :  tensor([[192558.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8013e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150434.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(20843076., grad_fn=<MseLossBackward>)
output :  tensor([[204982.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2272e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129472.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(223226.7188, grad_fn=<MseLossBackward>)
output :  tensor([[145939.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(881779.6875, grad_fn=<MseLossBackward>)
output :  tensor([[173302.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4876e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185173.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(458075.1562, grad_fn=<MseLossBackward>)
output :  tensor([[125028.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(943797.0625, grad_fn=<MseLossBackward>)
output :  tensor([[138228.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2989333., grad_fn=<MseLossBackward>)
output :  tensor([[172197.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(643931., grad_fn=<MseLossBackward>)
output :  tensor([[200467.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4535e+09, grad_fn=<MseLossBackward>)
output :  tensor([[241931.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1140891., grad_fn=<MseLossBackward>)
output :  tensor([[153816.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1401190.1250, grad_fn=<MseLossBackward>)
output :  tensor([[194601.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1955933.3750, grad_fn=<MseLossBackward>)
output :  tensor([[164420.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1701e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188189.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(75505240., grad_fn=<MseLossBackward>)
output :  tensor([[181633.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3004914., grad_fn=<MseLossBackward>)
output :  tensor([[99909.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(8464372., grad_fn=<MseLossBackward>)
output :  tensor([[172914.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1467e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133906.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1196220.7500, grad_fn=<MseLossBackward>)
output :  tensor([[120972.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(35667212., grad_fn=<MseLossBackward>)
output :  tensor([[171791.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4876644., grad_fn=<MseLossBackward>)
output :  tensor([[84057.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(889057.4375, grad_fn=<MseLossBackward>)
output :  tensor([[289407.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(351574.8750, grad_fn=<MseLossBackward>)
output :  tensor([[168817.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(14574261., grad_fn=<MseLossBackward>)
output :  tensor([[191142.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0171e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243815.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3898e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149926.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1152972.6250, grad_fn=<MseLossBackward>)
output :  tensor([[124148.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(22196.3438, grad_fn=<MseLossBackward>)
output :  tensor([[122628.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(7442623.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145581.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3520e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174369.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(136876.8750, grad_fn=<MseLossBackward>)
output :  tensor([[113505.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6133e+08, grad_fn=<MseLossBackward>)
output :  tensor([[210897.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1471e+10, grad_fn=<MseLossBackward>)
output :  tensor([[229437.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4549e+08, grad_fn=<MseLossBackward>)
output :  tensor([[251863.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0543e+10, grad_fn=<MseLossBackward>)
output :  tensor([[223536.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3912e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195028.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4513e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190549.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(9298116., grad_fn=<MseLossBackward>)
output :  tensor([[207119.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7415e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188353.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1800e+10, grad_fn=<MseLossBackward>)
output :  tensor([[176585.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4640725.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150816.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1399784.7500, grad_fn=<MseLossBackward>)
output :  tensor([[330059.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(48167072., grad_fn=<MseLossBackward>)
output :  tensor([[213311.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1720360.1250, grad_fn=<MseLossBackward>)
output :  tensor([[160482.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(232534.9219, grad_fn=<MseLossBackward>)
output :  tensor([[185636.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1208e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105021.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(454.2227, grad_fn=<MseLossBackward>)
output :  tensor([[271670.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0276e+10, grad_fn=<MseLossBackward>)
output :  tensor([[173464.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(189374.5625, grad_fn=<MseLossBackward>)
output :  tensor([[209830.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(13463969., grad_fn=<MseLossBackward>)
output :  tensor([[205964.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2606e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178690.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(259733.5625, grad_fn=<MseLossBackward>)
output :  tensor([[201829.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(869.3284, grad_fn=<MseLossBackward>)
output :  tensor([[157033.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4133279.5000, grad_fn=<MseLossBackward>)
output :  tensor([[149801.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4802e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116523.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3907540.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139450.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(302190.7188, grad_fn=<MseLossBackward>)
output :  tensor([[147149.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3424408., grad_fn=<MseLossBackward>)
output :  tensor([[201892.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5903e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160242.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(550842.3125, grad_fn=<MseLossBackward>)
output :  tensor([[101681.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(4759726.5000, grad_fn=<MseLossBackward>)
output :  tensor([[225242.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1778e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188429.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2574e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176252.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(54034.4570, grad_fn=<MseLossBackward>)
output :  tensor([[84344.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5496533.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128206.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(85871.8906, grad_fn=<MseLossBackward>)
output :  tensor([[214691.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(478431.5938, grad_fn=<MseLossBackward>)
output :  tensor([[143636.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(132382.2812, grad_fn=<MseLossBackward>)
output :  tensor([[130336.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(113242.7656, grad_fn=<MseLossBackward>)
output :  tensor([[144498.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3604183.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180824.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8770e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145933.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3736791., grad_fn=<MseLossBackward>)
output :  tensor([[161443.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2084549.3750, grad_fn=<MseLossBackward>)
output :  tensor([[215133.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(17759.7266, grad_fn=<MseLossBackward>)
output :  tensor([[139658.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2012e+09, grad_fn=<MseLossBackward>)
output :  tensor([[257815.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7924753., grad_fn=<MseLossBackward>)
output :  tensor([[160491.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(982607.5625, grad_fn=<MseLossBackward>)
output :  tensor([[130668.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(4703375., grad_fn=<MseLossBackward>)
output :  tensor([[94362.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(406426.1875, grad_fn=<MseLossBackward>)
output :  tensor([[158911.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5371e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181062.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1352278.2500, grad_fn=<MseLossBackward>)
output :  tensor([[118520.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(3918513., grad_fn=<MseLossBackward>)
output :  tensor([[190927.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4457e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146505.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4897e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150654.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(569718.3125, grad_fn=<MseLossBackward>)
output :  tensor([[188068.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(101133.9375, grad_fn=<MseLossBackward>)
output :  tensor([[251077.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7640e+09, grad_fn=<MseLossBackward>)
output :  tensor([[91098.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(161252.4375, grad_fn=<MseLossBackward>)
output :  tensor([[231356.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(74706312., grad_fn=<MseLossBackward>)
output :  tensor([[127105.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1945327.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166464.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8875e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114959.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2379e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178319.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5378993., grad_fn=<MseLossBackward>)
output :  tensor([[164440.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2704e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154906.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9568e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239457.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(209134.7188, grad_fn=<MseLossBackward>)
output :  tensor([[228309.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8150e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125995.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1008894.6875, grad_fn=<MseLossBackward>)
output :  tensor([[128253.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(5077030., grad_fn=<MseLossBackward>)
output :  tensor([[222144.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(23576184., grad_fn=<MseLossBackward>)
output :  tensor([[230416.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(12844048., grad_fn=<MseLossBackward>)
output :  tensor([[224898.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3246528.2500, grad_fn=<MseLossBackward>)
output :  tensor([[146631.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1871808.7500, grad_fn=<MseLossBackward>)
output :  tensor([[207661.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5467121., grad_fn=<MseLossBackward>)
output :  tensor([[128167.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(66715076., grad_fn=<MseLossBackward>)
output :  tensor([[132345.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(24000.7871, grad_fn=<MseLossBackward>)
output :  tensor([[310293.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(22152024., grad_fn=<MseLossBackward>)
output :  tensor([[142567.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2458036., grad_fn=<MseLossBackward>)
output :  tensor([[121889.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0128e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106860.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(6966176.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155553.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8717e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178378.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2826e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171099.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3611603.2500, grad_fn=<MseLossBackward>)
output :  tensor([[193317.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(59015284., grad_fn=<MseLossBackward>)
output :  tensor([[98114.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(3556436., grad_fn=<MseLossBackward>)
output :  tensor([[181594.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6733700.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171150.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(10567376., grad_fn=<MseLossBackward>)
output :  tensor([[139610.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(372881.9688, grad_fn=<MseLossBackward>)
output :  tensor([[259565.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9072e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143315.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4007e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172031.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(937719.8750, grad_fn=<MseLossBackward>)
output :  tensor([[137632.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5603281., grad_fn=<MseLossBackward>)
output :  tensor([[197268.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(10441683., grad_fn=<MseLossBackward>)
output :  tensor([[170726.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(527166.7500, grad_fn=<MseLossBackward>)
output :  tensor([[243309.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(476596.0625, grad_fn=<MseLossBackward>)
output :  tensor([[133360.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1297641.3750, grad_fn=<MseLossBackward>)
output :  tensor([[150796.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2092859.5000, grad_fn=<MseLossBackward>)
output :  tensor([[216245.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1552282.3750, grad_fn=<MseLossBackward>)
output :  tensor([[159550.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(29693474., grad_fn=<MseLossBackward>)
output :  tensor([[199427.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0873e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134944.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7865e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130015.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1030859.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144322.]], grad_fn=<AddmmBackward>)
loss:  tensor(18679684., grad_fn=<MseLossBackward>)
output :  tensor([[202329.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5119e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166965.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7004e+09, grad_fn=<MseLossBackward>)
output :  tensor([[76901.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8567e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94812.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0636e+08, grad_fn=<MseLossBackward>)
output :  tensor([[257643.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(18924132., grad_fn=<MseLossBackward>)
output :  tensor([[202333.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0112e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115783.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(614435.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160920.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0649e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206253.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8898e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181501.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8320e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159005.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(16044781., grad_fn=<MseLossBackward>)
output :  tensor([[169486.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(263634.1250, grad_fn=<MseLossBackward>)
output :  tensor([[115666.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(444847.3125, grad_fn=<MseLossBackward>)
output :  tensor([[164711.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(94311712., grad_fn=<MseLossBackward>)
output :  tensor([[194004.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6631e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220956.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2121028.2500, grad_fn=<MseLossBackward>)
output :  tensor([[244568.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5043e+11, grad_fn=<MseLossBackward>)
output :  tensor([[146805.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(37793.7891, grad_fn=<MseLossBackward>)
output :  tensor([[108851.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(137727.9688, grad_fn=<MseLossBackward>)
output :  tensor([[169726.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4819e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151350.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(722792.1875, grad_fn=<MseLossBackward>)
output :  tensor([[233726.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(10713859., grad_fn=<MseLossBackward>)
output :  tensor([[114276.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(523667.0625, grad_fn=<MseLossBackward>)
output :  tensor([[183798.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(807835.8125, grad_fn=<MseLossBackward>)
output :  tensor([[184839.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3463146.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165314.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3928e+10, grad_fn=<MseLossBackward>)
output :  tensor([[96743.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4787e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239094.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(8915.4902, grad_fn=<MseLossBackward>)
output :  tensor([[178444.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5974281.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140602.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(363025.0938, grad_fn=<MseLossBackward>)
output :  tensor([[236119.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1254225., grad_fn=<MseLossBackward>)
output :  tensor([[159037.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(15702273., grad_fn=<MseLossBackward>)
output :  tensor([[202471.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5013e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135435.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(190055.1250, grad_fn=<MseLossBackward>)
output :  tensor([[185594.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5669e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137904.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3627656., grad_fn=<MseLossBackward>)
output :  tensor([[225371.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1297e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227347.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1311e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94233.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(17919612., grad_fn=<MseLossBackward>)
output :  tensor([[161733.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5285688.5000, grad_fn=<MseLossBackward>)
output :  tensor([[246261.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5529e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146801.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3245740., grad_fn=<MseLossBackward>)
output :  tensor([[110247.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8703e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166647.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4612092., grad_fn=<MseLossBackward>)
output :  tensor([[142777.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1495423.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129792.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2534862., grad_fn=<MseLossBackward>)
output :  tensor([[189919.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7722e+09, grad_fn=<MseLossBackward>)
output :  tensor([[122572.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(5275.5254, grad_fn=<MseLossBackward>)
output :  tensor([[153370.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1878612.8750, grad_fn=<MseLossBackward>)
output :  tensor([[170864.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(784608.4375, grad_fn=<MseLossBackward>)
output :  tensor([[152145.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1311669.1250, grad_fn=<MseLossBackward>)
output :  tensor([[160766.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4553689.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135244.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8880e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129318.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(7189646., grad_fn=<MseLossBackward>)
output :  tensor([[155363.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6775e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144887.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(541673., grad_fn=<MseLossBackward>)
output :  tensor([[160754.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(990211.5625, grad_fn=<MseLossBackward>)
output :  tensor([[141762.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0152e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148968.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(28408.0488, grad_fn=<MseLossBackward>)
output :  tensor([[183747.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(18082028., grad_fn=<MseLossBackward>)
output :  tensor([[167174.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3330739., grad_fn=<MseLossBackward>)
output :  tensor([[180847.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(718627.0625, grad_fn=<MseLossBackward>)
output :  tensor([[220728.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(530211.5000, grad_fn=<MseLossBackward>)
output :  tensor([[113291.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(29072738., grad_fn=<MseLossBackward>)
output :  tensor([[135373.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0969e+08, grad_fn=<MseLossBackward>)
output :  tensor([[284316.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2834908.7500, grad_fn=<MseLossBackward>)
output :  tensor([[117975.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3902785.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175136.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0127e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184917.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6790.7900, grad_fn=<MseLossBackward>)
output :  tensor([[171222.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0386e+08, grad_fn=<MseLossBackward>)
output :  tensor([[247949.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3174e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222603.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(364589.5312, grad_fn=<MseLossBackward>)
output :  tensor([[129681.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6556e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175606.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1107e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124410.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(168715.5625, grad_fn=<MseLossBackward>)
output :  tensor([[180030.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6951e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149059.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(15529018., grad_fn=<MseLossBackward>)
output :  tensor([[155153.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(74877112., grad_fn=<MseLossBackward>)
output :  tensor([[208187.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3560828., grad_fn=<MseLossBackward>)
output :  tensor([[145919.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8008e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174641.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1844928., grad_fn=<MseLossBackward>)
output :  tensor([[251080.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0765e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146829.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1369192.5000, grad_fn=<MseLossBackward>)
output :  tensor([[204607.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3774459.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161414.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2143936.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125441.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4018e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137016.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1603824.3750, grad_fn=<MseLossBackward>)
output :  tensor([[183899.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(10031.2744, grad_fn=<MseLossBackward>)
output :  tensor([[194100.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(16815894., grad_fn=<MseLossBackward>)
output :  tensor([[222797.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3828e+09, grad_fn=<MseLossBackward>)
output :  tensor([[253827.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(10067632., grad_fn=<MseLossBackward>)
output :  tensor([[182836.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8540e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143921.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7480e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142615.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3551163.5000, grad_fn=<MseLossBackward>)
output :  tensor([[72119.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0316e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133959.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1082445.1250, grad_fn=<MseLossBackward>)
output :  tensor([[129630.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(533322.1250, grad_fn=<MseLossBackward>)
output :  tensor([[153770.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(52483.9453, grad_fn=<MseLossBackward>)
output :  tensor([[127964.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(929973.9375, grad_fn=<MseLossBackward>)
output :  tensor([[77895.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1946461., grad_fn=<MseLossBackward>)
output :  tensor([[85519.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(12389410., grad_fn=<MseLossBackward>)
output :  tensor([[226761.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(27446630., grad_fn=<MseLossBackward>)
output :  tensor([[140262.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7077e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129508.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(982932.8125, grad_fn=<MseLossBackward>)
output :  tensor([[167806.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(650165.0625, grad_fn=<MseLossBackward>)
output :  tensor([[239903.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(24042780., grad_fn=<MseLossBackward>)
output :  tensor([[190562.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2489541.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155125.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(764395., grad_fn=<MseLossBackward>)
output :  tensor([[196601.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1687279.2500, grad_fn=<MseLossBackward>)
output :  tensor([[197320.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5744e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138237.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1532141.1250, grad_fn=<MseLossBackward>)
output :  tensor([[155675.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(456025.8750, grad_fn=<MseLossBackward>)
output :  tensor([[136038.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1475.0400, grad_fn=<MseLossBackward>)
output :  tensor([[197124.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0808e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153707.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(85400.9297, grad_fn=<MseLossBackward>)
output :  tensor([[136724.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8683e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149657.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(22630832., grad_fn=<MseLossBackward>)
output :  tensor([[208003.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(15969639., grad_fn=<MseLossBackward>)
output :  tensor([[103580.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6574e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166626.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(762374.5625, grad_fn=<MseLossBackward>)
output :  tensor([[126956.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(1089006.3750, grad_fn=<MseLossBackward>)
output :  tensor([[145575.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2029645.3750, grad_fn=<MseLossBackward>)
output :  tensor([[104959.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8127e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136906.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(351834.3438, grad_fn=<MseLossBackward>)
output :  tensor([[240443.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(19740944., grad_fn=<MseLossBackward>)
output :  tensor([[143785.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1475541.6250, grad_fn=<MseLossBackward>)
output :  tensor([[137934.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(188573.0625, grad_fn=<MseLossBackward>)
output :  tensor([[165467.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4038e+09, grad_fn=<MseLossBackward>)
output :  tensor([[262267.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4750e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178362.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(11308718., grad_fn=<MseLossBackward>)
output :  tensor([[105609.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(8027881., grad_fn=<MseLossBackward>)
output :  tensor([[200291.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9611e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163554.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(20740196., grad_fn=<MseLossBackward>)
output :  tensor([[162609.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6146e+10, grad_fn=<MseLossBackward>)
output :  tensor([[100447.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4613233., grad_fn=<MseLossBackward>)
output :  tensor([[122367.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1518902.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156935.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(875657.3125, grad_fn=<MseLossBackward>)
output :  tensor([[142116.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4479770.5000, grad_fn=<MseLossBackward>)
output :  tensor([[196259.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(13993327., grad_fn=<MseLossBackward>)
output :  tensor([[138910.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(9547134., grad_fn=<MseLossBackward>)
output :  tensor([[259408.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(8243448.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127973.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2231e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161924.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(12782859., grad_fn=<MseLossBackward>)
output :  tensor([[189646.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1315143.1250, grad_fn=<MseLossBackward>)
output :  tensor([[126286.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6526e+08, grad_fn=<MseLossBackward>)
output :  tensor([[254259.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(18147334., grad_fn=<MseLossBackward>)
output :  tensor([[157071.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9573e+08, grad_fn=<MseLossBackward>)
output :  tensor([[242219.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(9801987., grad_fn=<MseLossBackward>)
output :  tensor([[140185.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(14547192., grad_fn=<MseLossBackward>)
output :  tensor([[209611.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(150786.5938, grad_fn=<MseLossBackward>)
output :  tensor([[173830.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2047582.1250, grad_fn=<MseLossBackward>)
output :  tensor([[154335.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(112875., grad_fn=<MseLossBackward>)
output :  tensor([[116715.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1649498.7500, grad_fn=<MseLossBackward>)
output :  tensor([[235560.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6553e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238629.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1879555.3750, grad_fn=<MseLossBackward>)
output :  tensor([[151094.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5029437., grad_fn=<MseLossBackward>)
output :  tensor([[253930.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(940233.2500, grad_fn=<MseLossBackward>)
output :  tensor([[122740.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(67844048., grad_fn=<MseLossBackward>)
output :  tensor([[177563.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2444239., grad_fn=<MseLossBackward>)
output :  tensor([[164569.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(20882472., grad_fn=<MseLossBackward>)
output :  tensor([[129191.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3270276.7500, grad_fn=<MseLossBackward>)
output :  tensor([[197954.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6860e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163619.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(144958.6719, grad_fn=<MseLossBackward>)
output :  tensor([[164474.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2175579., grad_fn=<MseLossBackward>)
output :  tensor([[158180.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(32512.5977, grad_fn=<MseLossBackward>)
output :  tensor([[151233.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1779431., grad_fn=<MseLossBackward>)
output :  tensor([[175605.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3700e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160976.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(953277.6250, grad_fn=<MseLossBackward>)
output :  tensor([[374930.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(81720472., grad_fn=<MseLossBackward>)
output :  tensor([[135420.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(70906400., grad_fn=<MseLossBackward>)
output :  tensor([[131128.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0819e+09, grad_fn=<MseLossBackward>)
output :  tensor([[276637.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(20934056., grad_fn=<MseLossBackward>)
output :  tensor([[159262.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7493906., grad_fn=<MseLossBackward>)
output :  tensor([[134236.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8870e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244301.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5132e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180205.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(86895.9844, grad_fn=<MseLossBackward>)
output :  tensor([[155355.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(11256864., grad_fn=<MseLossBackward>)
output :  tensor([[145323.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(104419.8672, grad_fn=<MseLossBackward>)
output :  tensor([[157067.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0672e+08, grad_fn=<MseLossBackward>)
output :  tensor([[101026.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(1053525.8750, grad_fn=<MseLossBackward>)
output :  tensor([[79121.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6562e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164961.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1497.9319, grad_fn=<MseLossBackward>)
output :  tensor([[187993.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6005e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159998.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3994502., grad_fn=<MseLossBackward>)
output :  tensor([[161119.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(13100893., grad_fn=<MseLossBackward>)
output :  tensor([[137039.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(168343.5312, grad_fn=<MseLossBackward>)
output :  tensor([[206493.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(295800., grad_fn=<MseLossBackward>)
output :  tensor([[138929.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(864173.5625, grad_fn=<MseLossBackward>)
output :  tensor([[181418.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6533e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145978.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(448.9102, grad_fn=<MseLossBackward>)
output :  tensor([[110550.]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5900e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93222.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(604384.7500, grad_fn=<MseLossBackward>)
output :  tensor([[175934.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(872998.2500, grad_fn=<MseLossBackward>)
output :  tensor([[256510.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(15131614., grad_fn=<MseLossBackward>)
output :  tensor([[139262.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5008504., grad_fn=<MseLossBackward>)
output :  tensor([[156166.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(13904043., grad_fn=<MseLossBackward>)
output :  tensor([[133722.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1495652.6250, grad_fn=<MseLossBackward>)
output :  tensor([[145593.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(15257324., grad_fn=<MseLossBackward>)
output :  tensor([[170632.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7468093.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127909.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(827588.1875, grad_fn=<MseLossBackward>)
output :  tensor([[173577.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1670e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156172.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(683980.6875, grad_fn=<MseLossBackward>)
output :  tensor([[118367.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(3488402.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159284.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4340e+09, grad_fn=<MseLossBackward>)
output :  tensor([[51326.1836]], grad_fn=<AddmmBackward>)
loss:  tensor(454028.5625, grad_fn=<MseLossBackward>)
output :  tensor([[233029.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3156e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201092.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8570.7090, grad_fn=<MseLossBackward>)
output :  tensor([[181761.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(10489603., grad_fn=<MseLossBackward>)
output :  tensor([[106102.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(10421.5391, grad_fn=<MseLossBackward>)
output :  tensor([[88782.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3178810.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138353.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2712557.5000, grad_fn=<MseLossBackward>)
output :  tensor([[218408.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7140e+09, grad_fn=<MseLossBackward>)
output :  tensor([[203131.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(19081336., grad_fn=<MseLossBackward>)
output :  tensor([[164973.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(707.2275, grad_fn=<MseLossBackward>)
output :  tensor([[171157.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8064e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190213.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(45428.9258, grad_fn=<MseLossBackward>)
output :  tensor([[87532.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(283972.4062, grad_fn=<MseLossBackward>)
output :  tensor([[140657.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(432552.8438, grad_fn=<MseLossBackward>)
output :  tensor([[114606.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(16864498., grad_fn=<MseLossBackward>)
output :  tensor([[149879.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9375e+08, grad_fn=<MseLossBackward>)
output :  tensor([[170475.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5583e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192669.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5205e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180757.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(573522.2500, grad_fn=<MseLossBackward>)
output :  tensor([[98345.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3405928., grad_fn=<MseLossBackward>)
output :  tensor([[116156.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(1805769., grad_fn=<MseLossBackward>)
output :  tensor([[159892.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8119e+08, grad_fn=<MseLossBackward>)
output :  tensor([[200506.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(256985.6250, grad_fn=<MseLossBackward>)
output :  tensor([[142815.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1403114.2500, grad_fn=<MseLossBackward>)
train_loss: [2.6382618e+09]
epoch_result tensor([0.])
output :  tensor([[156047.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6015752.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123500.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2250375., grad_fn=<MseLossBackward>)
output :  tensor([[194222.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(443.6289, grad_fn=<MseLossBackward>)
output :  tensor([[176956.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1903.1406, grad_fn=<MseLossBackward>)
output :  tensor([[154484.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5299e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132274.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(18268412., grad_fn=<MseLossBackward>)
output :  tensor([[140782.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(47299.4531, grad_fn=<MseLossBackward>)
output :  tensor([[119810.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(657454.9375, grad_fn=<MseLossBackward>)
output :  tensor([[69750.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2658e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165158.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(708411.5625, grad_fn=<MseLossBackward>)
output :  tensor([[131935.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(65029356., grad_fn=<MseLossBackward>)
output :  tensor([[224034.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(931255.1875, grad_fn=<MseLossBackward>)
output :  tensor([[165224.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(14257350., grad_fn=<MseLossBackward>)
output :  tensor([[248987.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(507344.5938, grad_fn=<MseLossBackward>)
output :  tensor([[55880.6602]], grad_fn=<AddmmBackward>)
loss:  tensor(775562.3125, grad_fn=<MseLossBackward>)
output :  tensor([[163608.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6512e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180821.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(33894956., grad_fn=<MseLossBackward>)
output :  tensor([[164070.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(57316020., grad_fn=<MseLossBackward>)
output :  tensor([[274223.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(602903.7500, grad_fn=<MseLossBackward>)
output :  tensor([[194530.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6096038., grad_fn=<MseLossBackward>)
output :  tensor([[137510.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5619e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194864.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(970502.0625, grad_fn=<MseLossBackward>)
output :  tensor([[178125.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1878e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151110.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(12196.4414, grad_fn=<MseLossBackward>)
output :  tensor([[172326.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5413693., grad_fn=<MseLossBackward>)
output :  tensor([[85329.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(4901.0938, grad_fn=<MseLossBackward>)
output :  tensor([[168121.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0384e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184749.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(62993.1562, grad_fn=<MseLossBackward>)
output :  tensor([[204450.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6060e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110613.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(376650.7188, grad_fn=<MseLossBackward>)
output :  tensor([[166846.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(17249226., grad_fn=<MseLossBackward>)
output :  tensor([[137104.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(365155.8438, grad_fn=<MseLossBackward>)
output :  tensor([[130089.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1186686.8750, grad_fn=<MseLossBackward>)
output :  tensor([[120607.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(1227300.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147351.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2120e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169890.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1057e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153214.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(12351271., grad_fn=<MseLossBackward>)
output :  tensor([[180587.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(344935.9688, grad_fn=<MseLossBackward>)
output :  tensor([[139519.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2190446.2500, grad_fn=<MseLossBackward>)
output :  tensor([[103672.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8695e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135745.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2813e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133242.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3089190.7500, grad_fn=<MseLossBackward>)
output :  tensor([[136573.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(91649208., grad_fn=<MseLossBackward>)
output :  tensor([[226468.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2157502., grad_fn=<MseLossBackward>)
output :  tensor([[131149.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1211513., grad_fn=<MseLossBackward>)
output :  tensor([[151383.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5680551., grad_fn=<MseLossBackward>)
output :  tensor([[112626.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(392159.7188, grad_fn=<MseLossBackward>)
output :  tensor([[159937.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3886.7432, grad_fn=<MseLossBackward>)
output :  tensor([[142420.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7646e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192090.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8161.9932, grad_fn=<MseLossBackward>)
output :  tensor([[135983.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2351718., grad_fn=<MseLossBackward>)
output :  tensor([[100887.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(83029680., grad_fn=<MseLossBackward>)
output :  tensor([[233183.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(666723.3125, grad_fn=<MseLossBackward>)
output :  tensor([[163589.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4901e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159993.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(986638.6875, grad_fn=<MseLossBackward>)
output :  tensor([[203188.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8666e+10, grad_fn=<MseLossBackward>)
output :  tensor([[241419.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2674e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142966.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(284955.7812, grad_fn=<MseLossBackward>)
output :  tensor([[131269.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7456227.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159032.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(16259544., grad_fn=<MseLossBackward>)
output :  tensor([[134717.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(22255838., grad_fn=<MseLossBackward>)
output :  tensor([[181757.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1218e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181760.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5473552.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164580.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(9489384., grad_fn=<MseLossBackward>)
output :  tensor([[130013.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6865e+08, grad_fn=<MseLossBackward>)
output :  tensor([[142635.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(18347.5488, grad_fn=<MseLossBackward>)
output :  tensor([[141161.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(14735642., grad_fn=<MseLossBackward>)
output :  tensor([[171213.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6885e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191934.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2826e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140413.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(15319151., grad_fn=<MseLossBackward>)
output :  tensor([[170896.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1007200.4375, grad_fn=<MseLossBackward>)
output :  tensor([[177767.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(10450167., grad_fn=<MseLossBackward>)
output :  tensor([[115915.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(837825.5625, grad_fn=<MseLossBackward>)
output :  tensor([[222190.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1418369.3750, grad_fn=<MseLossBackward>)
output :  tensor([[176587.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(47785896., grad_fn=<MseLossBackward>)
output :  tensor([[125282.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(47109.3477, grad_fn=<MseLossBackward>)
output :  tensor([[193554.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(8676154., grad_fn=<MseLossBackward>)
output :  tensor([[175905.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1010559., grad_fn=<MseLossBackward>)
output :  tensor([[208343.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1651e+10, grad_fn=<MseLossBackward>)
output :  tensor([[208841.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4657234., grad_fn=<MseLossBackward>)
output :  tensor([[169602.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4901e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195341.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(707859.3125, grad_fn=<MseLossBackward>)
output :  tensor([[109925.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(9453559., grad_fn=<MseLossBackward>)
output :  tensor([[114665.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(4688070.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109946.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(4216573.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144947.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3431640.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158753.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3815e+10, grad_fn=<MseLossBackward>)
output :  tensor([[182222.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4937700.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128818.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(1737474.1250, grad_fn=<MseLossBackward>)
output :  tensor([[146535.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2357136.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179641.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0018e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117488.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(346488.5938, grad_fn=<MseLossBackward>)
output :  tensor([[199916.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8504514., grad_fn=<MseLossBackward>)
output :  tensor([[142655.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5495874.5000, grad_fn=<MseLossBackward>)
output :  tensor([[209442.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(11955171., grad_fn=<MseLossBackward>)
output :  tensor([[126890.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(792475.5000, grad_fn=<MseLossBackward>)
output :  tensor([[245562.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(7645743.5000, grad_fn=<MseLossBackward>)
output :  tensor([[236512.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3511e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149051.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1157e+08, grad_fn=<MseLossBackward>)
output :  tensor([[86140.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3205e+08, grad_fn=<MseLossBackward>)
output :  tensor([[190243.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1667e+09, grad_fn=<MseLossBackward>)
output :  tensor([[77382.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(13087832., grad_fn=<MseLossBackward>)
output :  tensor([[140453.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(908804.7500, grad_fn=<MseLossBackward>)
output :  tensor([[77679.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(4749096.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144263.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1716141., grad_fn=<MseLossBackward>)
output :  tensor([[175439.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(314440.5625, grad_fn=<MseLossBackward>)
output :  tensor([[152579.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(848010.7500, grad_fn=<MseLossBackward>)
output :  tensor([[108095.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(484198.5312, grad_fn=<MseLossBackward>)
output :  tensor([[203440.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2613e+10, grad_fn=<MseLossBackward>)
output :  tensor([[127948.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(304462.5625, grad_fn=<MseLossBackward>)
output :  tensor([[268012.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4371e+08, grad_fn=<MseLossBackward>)
output :  tensor([[300069.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(98609864., grad_fn=<MseLossBackward>)
output :  tensor([[109850.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(5525548., grad_fn=<MseLossBackward>)
output :  tensor([[170213.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(5230297.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133920.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7189e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139387.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(150010.9688, grad_fn=<MseLossBackward>)
output :  tensor([[129241.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1017482., grad_fn=<MseLossBackward>)
output :  tensor([[127050.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4203397., grad_fn=<MseLossBackward>)
output :  tensor([[135599.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8120e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227074.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8387e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186386.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3905e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144770.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(758532.1250, grad_fn=<MseLossBackward>)
output :  tensor([[127116.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(146760.8281, grad_fn=<MseLossBackward>)
output :  tensor([[111846.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(356101.2500, grad_fn=<MseLossBackward>)
output :  tensor([[256285.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8162e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138321.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(11035580., grad_fn=<MseLossBackward>)
output :  tensor([[200053.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(8679560., grad_fn=<MseLossBackward>)
output :  tensor([[106084.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1402115., grad_fn=<MseLossBackward>)
output :  tensor([[138390.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2431553., grad_fn=<MseLossBackward>)
output :  tensor([[206798.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1335e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179322.]], grad_fn=<AddmmBackward>)
loss:  tensor(334084., grad_fn=<MseLossBackward>)
output :  tensor([[186386.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1921732.3750, grad_fn=<MseLossBackward>)
output :  tensor([[162919.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1340e+10, grad_fn=<MseLossBackward>)
output :  tensor([[295218.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5826e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200707.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7879512., grad_fn=<MseLossBackward>)
output :  tensor([[261596.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9956e+10, grad_fn=<MseLossBackward>)
output :  tensor([[218825.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2255e+09, grad_fn=<MseLossBackward>)
output :  tensor([[280801.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3104e+09, grad_fn=<MseLossBackward>)
output :  tensor([[222303.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2878960.5000, grad_fn=<MseLossBackward>)
output :  tensor([[222581.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8703e+10, grad_fn=<MseLossBackward>)
output :  tensor([[202345.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(28576208., grad_fn=<MseLossBackward>)
output :  tensor([[159898.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5473e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131656.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(712283.2500, grad_fn=<MseLossBackward>)
output :  tensor([[133355.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4598679., grad_fn=<MseLossBackward>)
output :  tensor([[92175.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1380955.5000, grad_fn=<MseLossBackward>)
output :  tensor([[108123.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(15229.1025, grad_fn=<MseLossBackward>)
output :  tensor([[271162.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3337e+09, grad_fn=<MseLossBackward>)
output :  tensor([[235960.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(923310.8125, grad_fn=<MseLossBackward>)
output :  tensor([[145803.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(645562.0625, grad_fn=<MseLossBackward>)
output :  tensor([[134732.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7660267., grad_fn=<MseLossBackward>)
output :  tensor([[170469.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(10652676., grad_fn=<MseLossBackward>)
output :  tensor([[151110.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(34350040., grad_fn=<MseLossBackward>)
output :  tensor([[164067.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2613e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165514.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(264276.3125, grad_fn=<MseLossBackward>)
output :  tensor([[136371.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(395483.7500, grad_fn=<MseLossBackward>)
output :  tensor([[190161.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5781e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114515.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(6327622.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168973.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(9161972., grad_fn=<MseLossBackward>)
output :  tensor([[124296.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(18462464., grad_fn=<MseLossBackward>)
output :  tensor([[89344.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(5496424., grad_fn=<MseLossBackward>)
output :  tensor([[180001.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1174, grad_fn=<MseLossBackward>)
output :  tensor([[112146.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(5047780., grad_fn=<MseLossBackward>)
output :  tensor([[242177.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(10097599., grad_fn=<MseLossBackward>)
output :  tensor([[247117.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4484071., grad_fn=<MseLossBackward>)
output :  tensor([[131690.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4796237., grad_fn=<MseLossBackward>)
output :  tensor([[107477.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2195999.7500, grad_fn=<MseLossBackward>)
output :  tensor([[287307.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2454e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174654.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(9952842., grad_fn=<MseLossBackward>)
output :  tensor([[124209.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(624877.8750, grad_fn=<MseLossBackward>)
output :  tensor([[144705.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1316e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198943.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2671e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137819.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(10114189., grad_fn=<MseLossBackward>)
output :  tensor([[156943.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5143e+10, grad_fn=<MseLossBackward>)
output :  tensor([[154783.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(779854.5625, grad_fn=<MseLossBackward>)
output :  tensor([[130436.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(877837.2500, grad_fn=<MseLossBackward>)
output :  tensor([[243239.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8295e+10, grad_fn=<MseLossBackward>)
output :  tensor([[403786.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3191582.2500, grad_fn=<MseLossBackward>)
output :  tensor([[111548.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6495250.5000, grad_fn=<MseLossBackward>)
output :  tensor([[118842.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(117354.4219, grad_fn=<MseLossBackward>)
output :  tensor([[155399.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(16812306., grad_fn=<MseLossBackward>)
output :  tensor([[132336.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6930e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160912.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7317e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173694.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0570e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103294.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(93626.4375, grad_fn=<MseLossBackward>)
output :  tensor([[138024.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(8853507., grad_fn=<MseLossBackward>)
output :  tensor([[365790.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2259666.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202350.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6677e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171192.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(18552672., grad_fn=<MseLossBackward>)
output :  tensor([[205036.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4566101., grad_fn=<MseLossBackward>)
output :  tensor([[135686.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(10977004., grad_fn=<MseLossBackward>)
output :  tensor([[194791.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(85008.6875, grad_fn=<MseLossBackward>)
output :  tensor([[135720.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9639e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181197.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(39160.6992, grad_fn=<MseLossBackward>)
output :  tensor([[239958.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4169317.2500, grad_fn=<MseLossBackward>)
output :  tensor([[169395.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(21202572., grad_fn=<MseLossBackward>)
output :  tensor([[109767.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(3123531.5000, grad_fn=<MseLossBackward>)
output :  tensor([[264224.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(113001.0234, grad_fn=<MseLossBackward>)
output :  tensor([[248935.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1133526.2500, grad_fn=<MseLossBackward>)
output :  tensor([[118882.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(16954450., grad_fn=<MseLossBackward>)
output :  tensor([[213838.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7408e+09, grad_fn=<MseLossBackward>)
output :  tensor([[302572.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1654e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209078.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4318928., grad_fn=<MseLossBackward>)
output :  tensor([[211844.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6424e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157480.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(176045.7969, grad_fn=<MseLossBackward>)
output :  tensor([[170377.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(150132.0312, grad_fn=<MseLossBackward>)
output :  tensor([[164173.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(52440000., grad_fn=<MseLossBackward>)
output :  tensor([[172656.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(7056577., grad_fn=<MseLossBackward>)
output :  tensor([[232380.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2687e+09, grad_fn=<MseLossBackward>)
output :  tensor([[215791.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8671e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160764.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8946e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126097.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(9593538., grad_fn=<MseLossBackward>)
output :  tensor([[176507.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(242525.4688, grad_fn=<MseLossBackward>)
output :  tensor([[179357.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5032e+09, grad_fn=<MseLossBackward>)
output :  tensor([[203833.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6398e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136120.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2852510., grad_fn=<MseLossBackward>)
output :  tensor([[149104.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5652e+08, grad_fn=<MseLossBackward>)
output :  tensor([[274553.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5984292., grad_fn=<MseLossBackward>)
output :  tensor([[88580.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(12819029., grad_fn=<MseLossBackward>)
output :  tensor([[234255.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5036798.5000, grad_fn=<MseLossBackward>)
output :  tensor([[255407.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0727e+11, grad_fn=<MseLossBackward>)
output :  tensor([[169966.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1133.7952, grad_fn=<MseLossBackward>)
output :  tensor([[191303.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9094e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153467.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2348747.7500, grad_fn=<MseLossBackward>)
output :  tensor([[205682.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1367e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128524.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(226330.6250, grad_fn=<MseLossBackward>)
output :  tensor([[148114.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9701278., grad_fn=<MseLossBackward>)
output :  tensor([[170866.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0466e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186384.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(286208.2812, grad_fn=<MseLossBackward>)
output :  tensor([[128407.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(5798276., grad_fn=<MseLossBackward>)
output :  tensor([[136126.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(139782.5156, grad_fn=<MseLossBackward>)
output :  tensor([[173589.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(347436.5625, grad_fn=<MseLossBackward>)
output :  tensor([[200267.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4733e+09, grad_fn=<MseLossBackward>)
output :  tensor([[241102.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3599676.2500, grad_fn=<MseLossBackward>)
output :  tensor([[154013.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(973459.7500, grad_fn=<MseLossBackward>)
output :  tensor([[200217.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(17788360., grad_fn=<MseLossBackward>)
output :  tensor([[161175.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9500e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187965.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(71664160., grad_fn=<MseLossBackward>)
output :  tensor([[179761.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(19281.9258, grad_fn=<MseLossBackward>)
output :  tensor([[97731.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(535458.0625, grad_fn=<MseLossBackward>)
output :  tensor([[171828.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1701e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132830.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4704832., grad_fn=<MseLossBackward>)
output :  tensor([[119819.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(23228860., grad_fn=<MseLossBackward>)
output :  tensor([[174142.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(20413.2656, grad_fn=<MseLossBackward>)
output :  tensor([[89044.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(16357791., grad_fn=<MseLossBackward>)
output :  tensor([[287544.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6028406., grad_fn=<MseLossBackward>)
output :  tensor([[166283.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1648615.8750, grad_fn=<MseLossBackward>)
output :  tensor([[191110.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0180e+10, grad_fn=<MseLossBackward>)
output :  tensor([[242050.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3807e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151523.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(273741.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122782.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1482800.8750, grad_fn=<MseLossBackward>)
output :  tensor([[120996.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1203031.8750, grad_fn=<MseLossBackward>)
output :  tensor([[145017.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0103e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175200.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1440562.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110113.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6249e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206588.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2413e+10, grad_fn=<MseLossBackward>)
output :  tensor([[236007.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(30172020., grad_fn=<MseLossBackward>)
output :  tensor([[249679.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1174e+10, grad_fn=<MseLossBackward>)
output :  tensor([[220140.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5567e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194460.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4651e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188956.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2120345.5000, grad_fn=<MseLossBackward>)
output :  tensor([[207812.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7114e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187194.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2143e+10, grad_fn=<MseLossBackward>)
output :  tensor([[183354.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(21297216., grad_fn=<MseLossBackward>)
output :  tensor([[152332.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(110410.8281, grad_fn=<MseLossBackward>)
output :  tensor([[333889.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(9675988., grad_fn=<MseLossBackward>)
output :  tensor([[208761.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(10487376., grad_fn=<MseLossBackward>)
output :  tensor([[160092.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(8596.7666, grad_fn=<MseLossBackward>)
output :  tensor([[184939.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1991e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103898.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(1212906.3750, grad_fn=<MseLossBackward>)
output :  tensor([[268959.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1819e+10, grad_fn=<MseLossBackward>)
output :  tensor([[172946.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(909817.8750, grad_fn=<MseLossBackward>)
output :  tensor([[215488.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3954318.7500, grad_fn=<MseLossBackward>)
output :  tensor([[205868.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2896e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179922.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(522074., grad_fn=<MseLossBackward>)
output :  tensor([[203370.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2466519.2500, grad_fn=<MseLossBackward>)
output :  tensor([[154214.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(617378.5000, grad_fn=<MseLossBackward>)
output :  tensor([[149966.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4966e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117401.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(1207200., grad_fn=<MseLossBackward>)
output :  tensor([[139677.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(103734.3203, grad_fn=<MseLossBackward>)
output :  tensor([[144822.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(17453986., grad_fn=<MseLossBackward>)
output :  tensor([[200970.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6137e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160599.]], grad_fn=<AddmmBackward>)
loss:  tensor(1207801., grad_fn=<MseLossBackward>)
output :  tensor([[100572.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1149519., grad_fn=<MseLossBackward>)
output :  tensor([[226438.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8391e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188955.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5014e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175453.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1063315.3750, grad_fn=<MseLossBackward>)
output :  tensor([[83827.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(3340984.2500, grad_fn=<MseLossBackward>)
output :  tensor([[130694.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4816104.5000, grad_fn=<MseLossBackward>)
output :  tensor([[212661.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1792837.3750, grad_fn=<MseLossBackward>)
output :  tensor([[143584.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(172341.7344, grad_fn=<MseLossBackward>)
output :  tensor([[130258.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(67028.3984, grad_fn=<MseLossBackward>)
output :  tensor([[146809.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(17719232., grad_fn=<MseLossBackward>)
output :  tensor([[180169.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8207e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145390.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1932447.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160537.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(289091.0312, grad_fn=<MseLossBackward>)
output :  tensor([[214683.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(99895.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136868.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0156e+09, grad_fn=<MseLossBackward>)
output :  tensor([[254216.]], grad_fn=<AddmmBackward>)
loss:  tensor(614656., grad_fn=<MseLossBackward>)
output :  tensor([[157533.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3866077.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129453.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(909817.8750, grad_fn=<MseLossBackward>)
output :  tensor([[96301.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(1694288.6250, grad_fn=<MseLossBackward>)
output :  tensor([[156469.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1796e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175992.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(15272098., grad_fn=<MseLossBackward>)
output :  tensor([[122495.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3980960.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188233.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6578e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147307.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5979e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149684.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(46251.8789, grad_fn=<MseLossBackward>)
output :  tensor([[187669.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6548.3496, grad_fn=<MseLossBackward>)
output :  tensor([[254140.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5160e+09, grad_fn=<MseLossBackward>)
output :  tensor([[90295.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(1450914.3750, grad_fn=<MseLossBackward>)
output :  tensor([[237443.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6534733.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128619.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(14183.3213, grad_fn=<MseLossBackward>)
output :  tensor([[168355.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5150e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116248.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6403e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175921.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6130.4004, grad_fn=<MseLossBackward>)
output :  tensor([[166302.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2377e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158150.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6457e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237479.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2313108.2500, grad_fn=<MseLossBackward>)
output :  tensor([[227766.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1408e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126286.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(509662.1250, grad_fn=<MseLossBackward>)
output :  tensor([[121617.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(19207196., grad_fn=<MseLossBackward>)
output :  tensor([[226253.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(557845.6250, grad_fn=<MseLossBackward>)
output :  tensor([[230257.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(14005721., grad_fn=<MseLossBackward>)
output :  tensor([[227479.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(608326.8750, grad_fn=<MseLossBackward>)
output :  tensor([[147612.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(149841.5781, grad_fn=<MseLossBackward>)
output :  tensor([[212321.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5388709.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134180.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0109e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135829.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(11087131., grad_fn=<MseLossBackward>)
output :  tensor([[310001.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(24983440., grad_fn=<MseLossBackward>)
output :  tensor([[140309.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(476315.6562, grad_fn=<MseLossBackward>)
output :  tensor([[121589.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9800e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108974.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(276248.7812, grad_fn=<MseLossBackward>)
output :  tensor([[156039.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7095e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181596.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6729e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176538.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(12518881., grad_fn=<MseLossBackward>)
output :  tensor([[189602.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2991e+08, grad_fn=<MseLossBackward>)
output :  tensor([[107013.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(49182496., grad_fn=<MseLossBackward>)
output :  tensor([[177487.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2288176.2500, grad_fn=<MseLossBackward>)
output :  tensor([[171856.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(15657107., grad_fn=<MseLossBackward>)
output :  tensor([[138290.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(503412.4375, grad_fn=<MseLossBackward>)
output :  tensor([[259543.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9115e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146329.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7613e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175439.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(5952761.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143864.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(14935809., grad_fn=<MseLossBackward>)
output :  tensor([[197444.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(9338850., grad_fn=<MseLossBackward>)
output :  tensor([[166165.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(14703870., grad_fn=<MseLossBackward>)
output :  tensor([[244240.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(57870.3164, grad_fn=<MseLossBackward>)
output :  tensor([[134185.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(98753.0625, grad_fn=<MseLossBackward>)
output :  tensor([[150680.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1771228.2500, grad_fn=<MseLossBackward>)
output :  tensor([[212065.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(8609090., grad_fn=<MseLossBackward>)
output :  tensor([[162876.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4510778.5000, grad_fn=<MseLossBackward>)
output :  tensor([[195606.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(43640680., grad_fn=<MseLossBackward>)
output :  tensor([[134398.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0524e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130656.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(2742983., grad_fn=<MseLossBackward>)
output :  tensor([[142950.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(8707479., grad_fn=<MseLossBackward>)
output :  tensor([[199472.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9038e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167083.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7126e+09, grad_fn=<MseLossBackward>)
output :  tensor([[75721.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4715e+08, grad_fn=<MseLossBackward>)
output :  tensor([[95135.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1311e+08, grad_fn=<MseLossBackward>)
output :  tensor([[250398.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(8375417., grad_fn=<MseLossBackward>)
output :  tensor([[202574.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0417e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115275.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(75663.6797, grad_fn=<MseLossBackward>)
output :  tensor([[159237.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9875e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208991.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2118e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181067.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9091e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156969.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3880469., grad_fn=<MseLossBackward>)
output :  tensor([[169013.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(973613.8750, grad_fn=<MseLossBackward>)
output :  tensor([[114724.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(75878.7266, grad_fn=<MseLossBackward>)
output :  tensor([[164999.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(99989688., grad_fn=<MseLossBackward>)
output :  tensor([[193773.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7229e+08, grad_fn=<MseLossBackward>)
output :  tensor([[215617.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(15074413., grad_fn=<MseLossBackward>)
output :  tensor([[243841.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5116e+11, grad_fn=<MseLossBackward>)
output :  tensor([[144456.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6471220.5000, grad_fn=<MseLossBackward>)
output :  tensor([[106529.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(3806126.7500, grad_fn=<MseLossBackward>)
output :  tensor([[170570.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2837e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148504.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3981833.2500, grad_fn=<MseLossBackward>)
output :  tensor([[240695.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(13657067., grad_fn=<MseLossBackward>)
output :  tensor([[116654.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(2736569., grad_fn=<MseLossBackward>)
output :  tensor([[178290.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(21243314., grad_fn=<MseLossBackward>)
output :  tensor([[190829.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(17050964., grad_fn=<MseLossBackward>)
output :  tensor([[166111.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3682e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97100.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5923e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235946.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(9324626., grad_fn=<MseLossBackward>)
output :  tensor([[179769.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(14209012., grad_fn=<MseLossBackward>)
output :  tensor([[141108.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1228841.5000, grad_fn=<MseLossBackward>)
output :  tensor([[237747.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(7548842., grad_fn=<MseLossBackward>)
output :  tensor([[163770.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(593140.6250, grad_fn=<MseLossBackward>)
output :  tensor([[201215.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5323e+10, grad_fn=<MseLossBackward>)
output :  tensor([[137049.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4202179.5000, grad_fn=<MseLossBackward>)
output :  tensor([[188508.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0268e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135851.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(22038.3301, grad_fn=<MseLossBackward>)
output :  tensor([[226893.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(82926352., grad_fn=<MseLossBackward>)
output :  tensor([[225112.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1937e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91943.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(3777647.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161529.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4390203.5000, grad_fn=<MseLossBackward>)
output :  tensor([[243183.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6306e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146341.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1800670.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110521.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8941e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163613.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(785632.9375, grad_fn=<MseLossBackward>)
output :  tensor([[149100.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(26010318., grad_fn=<MseLossBackward>)
output :  tensor([[127754.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(198658.2344, grad_fn=<MseLossBackward>)
output :  tensor([[190021.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7580e+09, grad_fn=<MseLossBackward>)
output :  tensor([[122146.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(125249.6328, grad_fn=<MseLossBackward>)
output :  tensor([[154271.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5159286.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169158.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(6717816., grad_fn=<MseLossBackward>)
output :  tensor([[147739.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(10632389., grad_fn=<MseLossBackward>)
output :  tensor([[162244.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(429721.2188, grad_fn=<MseLossBackward>)
output :  tensor([[134610.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5590e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131217.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(611866.1875, grad_fn=<MseLossBackward>)
output :  tensor([[157099.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2759e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146781.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6916571.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161433.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(100281.0781, grad_fn=<MseLossBackward>)
output :  tensor([[141640.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0074e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150730.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3725081., grad_fn=<MseLossBackward>)
output :  tensor([[186505.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2232736.2500, grad_fn=<MseLossBackward>)
output :  tensor([[169864.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(747549.3750, grad_fn=<MseLossBackward>)
output :  tensor([[178511.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2216516.2500, grad_fn=<MseLossBackward>)
output :  tensor([[221918.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3680522.2500, grad_fn=<MseLossBackward>)
output :  tensor([[111191.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(10836390., grad_fn=<MseLossBackward>)
output :  tensor([[139865.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2397e+08, grad_fn=<MseLossBackward>)
output :  tensor([[285914.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7246.2656, grad_fn=<MseLossBackward>)
output :  tensor([[118857.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8167628., grad_fn=<MseLossBackward>)
output :  tensor([[176969.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8516e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186394.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1943933., grad_fn=<MseLossBackward>)
output :  tensor([[189580.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(16647548., grad_fn=<MseLossBackward>)
output :  tensor([[251487.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5284e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222851.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(724812.8125, grad_fn=<MseLossBackward>)
output :  tensor([[131159.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3804e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178254.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3781e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122939.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1125356.2500, grad_fn=<MseLossBackward>)
output :  tensor([[182980.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5433e+10, grad_fn=<MseLossBackward>)
output :  tensor([[155115.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4476332., grad_fn=<MseLossBackward>)
output :  tensor([[155930.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(88933448., grad_fn=<MseLossBackward>)
output :  tensor([[206111.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(35667.8633, grad_fn=<MseLossBackward>)
output :  tensor([[146647.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0015e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176031.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(964.8789, grad_fn=<MseLossBackward>)
output :  tensor([[248965.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3237e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150488.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6190455., grad_fn=<MseLossBackward>)
output :  tensor([[199271.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(11512979., grad_fn=<MseLossBackward>)
output :  tensor([[161711.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3104093.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125717.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4226e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134112.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2680638.7500, grad_fn=<MseLossBackward>)
output :  tensor([[184412.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(170478.6719, grad_fn=<MseLossBackward>)
output :  tensor([[197403.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(54817132., grad_fn=<MseLossBackward>)
output :  tensor([[220541.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6866e+09, grad_fn=<MseLossBackward>)
output :  tensor([[254468.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6410074.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182311.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8684e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144319.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7899e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149595.]], grad_fn=<AddmmBackward>)
loss:  tensor(25959024., grad_fn=<MseLossBackward>)
output :  tensor([[76122.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3049e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141340.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(40207884., grad_fn=<MseLossBackward>)
output :  tensor([[126773.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4522002., grad_fn=<MseLossBackward>)
output :  tensor([[155068.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1141191.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126632.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(134884.0469, grad_fn=<MseLossBackward>)
output :  tensor([[77478.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(957034.1875, grad_fn=<MseLossBackward>)
output :  tensor([[82521.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(272117.0938, grad_fn=<MseLossBackward>)
output :  tensor([[236927.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(24279178., grad_fn=<MseLossBackward>)
output :  tensor([[140919.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0769e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133781.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(10765269., grad_fn=<MseLossBackward>)
output :  tensor([[170241.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(10506107., grad_fn=<MseLossBackward>)
output :  tensor([[233099.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3610950., grad_fn=<MseLossBackward>)
output :  tensor([[187648.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(20174696., grad_fn=<MseLossBackward>)
output :  tensor([[157592.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2536305., grad_fn=<MseLossBackward>)
output :  tensor([[201123.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(10392766., grad_fn=<MseLossBackward>)
output :  tensor([[201759.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2419e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135489.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2280855., grad_fn=<MseLossBackward>)
output :  tensor([[156565.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2449274., grad_fn=<MseLossBackward>)
output :  tensor([[132832.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(10032165., grad_fn=<MseLossBackward>)
output :  tensor([[196630.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1135e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156071.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4290983., grad_fn=<MseLossBackward>)
output :  tensor([[140695.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2274e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146600.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2892019., grad_fn=<MseLossBackward>)
output :  tensor([[209527.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(6115188., grad_fn=<MseLossBackward>)
output :  tensor([[102876.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3584e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169695.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4821455.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130979.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(8875698., grad_fn=<MseLossBackward>)
output :  tensor([[146833.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(27566.3750, grad_fn=<MseLossBackward>)
output :  tensor([[102640.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6206e+09, grad_fn=<MseLossBackward>)
output :  tensor([[140509.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(9059630., grad_fn=<MseLossBackward>)
output :  tensor([[235260.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(546536.7500, grad_fn=<MseLossBackward>)
output :  tensor([[146335.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1784645.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138945.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2088566.8750, grad_fn=<MseLossBackward>)
output :  tensor([[164996.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3687e+09, grad_fn=<MseLossBackward>)
output :  tensor([[267171.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1725e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173579.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2018042.2500, grad_fn=<MseLossBackward>)
output :  tensor([[105023.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(5050378.5000, grad_fn=<MseLossBackward>)
output :  tensor([[199734.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0474e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162104.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(9638696., grad_fn=<MseLossBackward>)
output :  tensor([[162136.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6350e+10, grad_fn=<MseLossBackward>)
output :  tensor([[100459.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4664722.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125703.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4425764., grad_fn=<MseLossBackward>)
output :  tensor([[156884.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(783197.3750, grad_fn=<MseLossBackward>)
output :  tensor([[140645.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(416670.2500, grad_fn=<MseLossBackward>)
output :  tensor([[199521.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(228887.4844, grad_fn=<MseLossBackward>)
output :  tensor([[145528.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(12450312., grad_fn=<MseLossBackward>)
output :  tensor([[267808.]], grad_fn=<AddmmBackward>)
loss:  tensor(30558784., grad_fn=<MseLossBackward>)
output :  tensor([[128334.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2485e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164156.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1804362.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186610.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3569147.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121972.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4335e+08, grad_fn=<MseLossBackward>)
output :  tensor([[250607.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(369037.2812, grad_fn=<MseLossBackward>)
output :  tensor([[159048.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8128e+08, grad_fn=<MseLossBackward>)
output :  tensor([[246253.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(816114.6250, grad_fn=<MseLossBackward>)
output :  tensor([[142693.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1706452.3750, grad_fn=<MseLossBackward>)
output :  tensor([[208528.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2165910., grad_fn=<MseLossBackward>)
output :  tensor([[176837.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(19693070., grad_fn=<MseLossBackward>)
output :  tensor([[153413.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(344000.5938, grad_fn=<MseLossBackward>)
output :  tensor([[120378.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(5658711.5000, grad_fn=<MseLossBackward>)
output :  tensor([[237187.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4903e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238603.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1950037.7500, grad_fn=<MseLossBackward>)
output :  tensor([[154185.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(720376.5625, grad_fn=<MseLossBackward>)
output :  tensor([[253809.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1188236.2500, grad_fn=<MseLossBackward>)
output :  tensor([[124166.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(93369944., grad_fn=<MseLossBackward>)
output :  tensor([[176639.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(408480.7500, grad_fn=<MseLossBackward>)
output :  tensor([[157615.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5685244., grad_fn=<MseLossBackward>)
output :  tensor([[136795.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(33590536., grad_fn=<MseLossBackward>)
output :  tensor([[197578.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6346e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167070.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9425763., grad_fn=<MseLossBackward>)
output :  tensor([[165240.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5020820.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158016.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(274.8342, grad_fn=<MseLossBackward>)
output :  tensor([[145336.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(20821112., grad_fn=<MseLossBackward>)
output :  tensor([[174581.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2356e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159311.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(473645.0625, grad_fn=<MseLossBackward>)
output :  tensor([[371769.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4884e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123748.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(10571693., grad_fn=<MseLossBackward>)
output :  tensor([[129633.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9478e+09, grad_fn=<MseLossBackward>)
output :  tensor([[276202.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(25104798., grad_fn=<MseLossBackward>)
output :  tensor([[163156.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1337853.6250, grad_fn=<MseLossBackward>)
output :  tensor([[132331.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3999e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227408.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(21081442., grad_fn=<MseLossBackward>)
output :  tensor([[180201.]], grad_fn=<AddmmBackward>)
loss:  tensor(89401., grad_fn=<MseLossBackward>)
output :  tensor([[154541.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6458190., grad_fn=<MseLossBackward>)
output :  tensor([[144532.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(218556.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155141.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3276e+08, grad_fn=<MseLossBackward>)
output :  tensor([[102633.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(6936022., grad_fn=<MseLossBackward>)
output :  tensor([[78992.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6073e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165518.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(269150.1875, grad_fn=<MseLossBackward>)
output :  tensor([[188333.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5734e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159221.]], grad_fn=<AddmmBackward>)
loss:  tensor(1490841., grad_fn=<MseLossBackward>)
output :  tensor([[157225.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(75436.0547, grad_fn=<MseLossBackward>)
output :  tensor([[141773.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(18688870., grad_fn=<MseLossBackward>)
output :  tensor([[203441.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6292023.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138239.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(57585., grad_fn=<MseLossBackward>)
output :  tensor([[181345.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6552e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149047.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9288399., grad_fn=<MseLossBackward>)
output :  tensor([[109367.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9525e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96822.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7966330., grad_fn=<MseLossBackward>)
output :  tensor([[173913.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1179803.2500, grad_fn=<MseLossBackward>)
output :  tensor([[264671.]], grad_fn=<AddmmBackward>)
loss:  tensor(18241440., grad_fn=<MseLossBackward>)
output :  tensor([[143892.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5723906.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159276.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(382909.5625, grad_fn=<MseLossBackward>)
output :  tensor([[133576.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1158852.2500, grad_fn=<MseLossBackward>)
output :  tensor([[146978.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(6359932.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170954.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(9331593., grad_fn=<MseLossBackward>)
output :  tensor([[125610.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(1931730.7500, grad_fn=<MseLossBackward>)
output :  tensor([[175289.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1747e+08, grad_fn=<MseLossBackward>)
output :  tensor([[159854.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(8148794.5000, grad_fn=<MseLossBackward>)
output :  tensor([[113334.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(10023210., grad_fn=<MseLossBackward>)
output :  tensor([[160546.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2495e+09, grad_fn=<MseLossBackward>)
output :  tensor([[56489.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(20152524., grad_fn=<MseLossBackward>)
output :  tensor([[234197.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1312e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197380.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(13100215., grad_fn=<MseLossBackward>)
output :  tensor([[185102.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(10451.8672, grad_fn=<MseLossBackward>)
output :  tensor([[105941.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(3467.1855, grad_fn=<MseLossBackward>)
output :  tensor([[89359.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5569305., grad_fn=<MseLossBackward>)
output :  tensor([[135575.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(19574126., grad_fn=<MseLossBackward>)
output :  tensor([[218917.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6374e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200352.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(51088544., grad_fn=<MseLossBackward>)
output :  tensor([[165317.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(100598., grad_fn=<MseLossBackward>)
output :  tensor([[173680.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3393e+09, grad_fn=<MseLossBackward>)
output :  tensor([[188581.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2011388.7500, grad_fn=<MseLossBackward>)
output :  tensor([[85547.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(2109552., grad_fn=<MseLossBackward>)
output :  tensor([[136828.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(10059205., grad_fn=<MseLossBackward>)
output :  tensor([[111066.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(320939.9688, grad_fn=<MseLossBackward>)
output :  tensor([[150491.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1118e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171562.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6453e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194654.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0703e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179278.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(521058.4062, grad_fn=<MseLossBackward>)
output :  tensor([[98114.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2606206.7500, grad_fn=<MseLossBackward>)
output :  tensor([[119126.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2644587.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159815.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8489e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197475.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6375388.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146031.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4126611.2500, grad_fn=<MseLossBackward>)
train_loss: [2.6495852e+09]
epoch_result tensor([0.])
output :  tensor([[158684.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(34069.0859, grad_fn=<MseLossBackward>)
output :  tensor([[120906.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1195947.2500, grad_fn=<MseLossBackward>)
output :  tensor([[192120.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4329910.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177657.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(432922.8750, grad_fn=<MseLossBackward>)
output :  tensor([[154952.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3120e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126732.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(1607289.1250, grad_fn=<MseLossBackward>)
output :  tensor([[143255.]], grad_fn=<AddmmBackward>)
loss:  tensor(5085025., grad_fn=<MseLossBackward>)
output :  tensor([[119391.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(152966.5469, grad_fn=<MseLossBackward>)
output :  tensor([[69791.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2750e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166303.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(92368.5078, grad_fn=<MseLossBackward>)
output :  tensor([[144411.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(19462710., grad_fn=<MseLossBackward>)
output :  tensor([[226304.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1702861.8750, grad_fn=<MseLossBackward>)
output :  tensor([[167410.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2526907.7500, grad_fn=<MseLossBackward>)
output :  tensor([[248258.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2079183.7500, grad_fn=<MseLossBackward>)
output :  tensor([[51333.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(13440473., grad_fn=<MseLossBackward>)
output :  tensor([[163535.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6235e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173706.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1672333.8750, grad_fn=<MseLossBackward>)
output :  tensor([[164791.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(68749752., grad_fn=<MseLossBackward>)
output :  tensor([[280818.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(33856760., grad_fn=<MseLossBackward>)
output :  tensor([[197847.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(717620.7500, grad_fn=<MseLossBackward>)
output :  tensor([[137970.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5366e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191673.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4862369.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177129.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2820e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151188.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(35585.2852, grad_fn=<MseLossBackward>)
output :  tensor([[164920.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(25801956., grad_fn=<MseLossBackward>)
output :  tensor([[87709.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5332419., grad_fn=<MseLossBackward>)
output :  tensor([[166448.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8567e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182319.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(7186420.5000, grad_fn=<MseLossBackward>)
output :  tensor([[203805.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6723e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110457.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(209163.3125, grad_fn=<MseLossBackward>)
output :  tensor([[172802.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3248555.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135021.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2185407.7500, grad_fn=<MseLossBackward>)
output :  tensor([[127861.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1296858.3750, grad_fn=<MseLossBackward>)
output :  tensor([[120569.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1143897.1250, grad_fn=<MseLossBackward>)
output :  tensor([[146524.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7167e+08, grad_fn=<MseLossBackward>)
output :  tensor([[170916.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0760e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151218.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2304466.2500, grad_fn=<MseLossBackward>)
output :  tensor([[181007.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1014772.9375, grad_fn=<MseLossBackward>)
output :  tensor([[142404.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1973278.6250, grad_fn=<MseLossBackward>)
output :  tensor([[102783.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6341e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133762.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5995e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134097.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(814478.0625, grad_fn=<MseLossBackward>)
output :  tensor([[131882.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(23840790., grad_fn=<MseLossBackward>)
output :  tensor([[223387.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2600861.7500, grad_fn=<MseLossBackward>)
output :  tensor([[131406.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(711729.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146127.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8253411., grad_fn=<MseLossBackward>)
output :  tensor([[109137.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(8196724.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162605.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6789526., grad_fn=<MseLossBackward>)
output :  tensor([[143753.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6262e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192005.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(26.2656, grad_fn=<MseLossBackward>)
output :  tensor([[134271.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(31979.4980, grad_fn=<MseLossBackward>)
output :  tensor([[106415.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(12850825., grad_fn=<MseLossBackward>)
output :  tensor([[236197.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4826877.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164106.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4387e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157868.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1279974., grad_fn=<MseLossBackward>)
output :  tensor([[203707.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8491e+10, grad_fn=<MseLossBackward>)
output :  tensor([[242936.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2335e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145462.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3850302.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139784.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(33462610., grad_fn=<MseLossBackward>)
output :  tensor([[155089.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8021.4414, grad_fn=<MseLossBackward>)
output :  tensor([[131855.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3443402.2500, grad_fn=<MseLossBackward>)
output :  tensor([[181942.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0930e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182200.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3608219., grad_fn=<MseLossBackward>)
output :  tensor([[161316.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(33700.9297, grad_fn=<MseLossBackward>)
output :  tensor([[142952.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2242.9104, grad_fn=<MseLossBackward>)
output :  tensor([[142138.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(130512.8516, grad_fn=<MseLossBackward>)
output :  tensor([[145222.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(49374.2305, grad_fn=<MseLossBackward>)
output :  tensor([[172110.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5664e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195205.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7501e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136964.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(216065.1875, grad_fn=<MseLossBackward>)
output :  tensor([[175626.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(13888549., grad_fn=<MseLossBackward>)
output :  tensor([[178643.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5555080.5000, grad_fn=<MseLossBackward>)
output :  tensor([[116268.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(1608953.5000, grad_fn=<MseLossBackward>)
output :  tensor([[219428.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2471135., grad_fn=<MseLossBackward>)
output :  tensor([[184191.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(477524.1875, grad_fn=<MseLossBackward>)
output :  tensor([[127674.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4730081.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198991.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6206716., grad_fn=<MseLossBackward>)
output :  tensor([[172321.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6646164.5000, grad_fn=<MseLossBackward>)
output :  tensor([[211966.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0375e+10, grad_fn=<MseLossBackward>)
output :  tensor([[207441.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(12661810., grad_fn=<MseLossBackward>)
output :  tensor([[169564.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4872e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192923.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2486732., grad_fn=<MseLossBackward>)
output :  tensor([[112077.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(850098.4375, grad_fn=<MseLossBackward>)
output :  tensor([[112777.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(77023.5938, grad_fn=<MseLossBackward>)
output :  tensor([[113330.]], grad_fn=<AddmmBackward>)
loss:  tensor(1768900., grad_fn=<MseLossBackward>)
output :  tensor([[145677.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1260286.8750, grad_fn=<MseLossBackward>)
output :  tensor([[160736.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3090e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178136.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3471933.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127035.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(215470.0312, grad_fn=<MseLossBackward>)
output :  tensor([[141799.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(10240700., grad_fn=<MseLossBackward>)
output :  tensor([[184366.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4469e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117207.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(94830.3125, grad_fn=<MseLossBackward>)
output :  tensor([[194565.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5928312., grad_fn=<MseLossBackward>)
output :  tensor([[145946.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(895625.6250, grad_fn=<MseLossBackward>)
output :  tensor([[213346.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(199278.5469, grad_fn=<MseLossBackward>)
output :  tensor([[128681.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7188934., grad_fn=<MseLossBackward>)
output :  tensor([[244555.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(14229870., grad_fn=<MseLossBackward>)
output :  tensor([[238301.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1807e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147862.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7102e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85484.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9951e+08, grad_fn=<MseLossBackward>)
output :  tensor([[190673.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0940e+09, grad_fn=<MseLossBackward>)
output :  tensor([[83512.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(6311832., grad_fn=<MseLossBackward>)
output :  tensor([[139517.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(295.9475, grad_fn=<MseLossBackward>)
output :  tensor([[74958.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(292807.8125, grad_fn=<MseLossBackward>)
output :  tensor([[143136.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(33551.9375, grad_fn=<MseLossBackward>)
output :  tensor([[176027.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(744.2666, grad_fn=<MseLossBackward>)
output :  tensor([[152723.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(602709.6250, grad_fn=<MseLossBackward>)
output :  tensor([[107823.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(179028.1562, grad_fn=<MseLossBackward>)
output :  tensor([[204370.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2405e+10, grad_fn=<MseLossBackward>)
output :  tensor([[130806.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(5321708.5000, grad_fn=<MseLossBackward>)
output :  tensor([[267319.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6080e+08, grad_fn=<MseLossBackward>)
output :  tensor([[303676.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(39980724., grad_fn=<MseLossBackward>)
output :  tensor([[108933.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(2055706.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170279.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4928747., grad_fn=<MseLossBackward>)
output :  tensor([[134668.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1122e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130807.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(67114496., grad_fn=<MseLossBackward>)
output :  tensor([[128873.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1893849., grad_fn=<MseLossBackward>)
output :  tensor([[128556.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(12651304., grad_fn=<MseLossBackward>)
output :  tensor([[136442.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2592e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227095.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8379e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186414.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3897e+10, grad_fn=<MseLossBackward>)
output :  tensor([[139461.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(19701808., grad_fn=<MseLossBackward>)
output :  tensor([[130011.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6309045., grad_fn=<MseLossBackward>)
output :  tensor([[112403.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(1330111.7500, grad_fn=<MseLossBackward>)
output :  tensor([[252474.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3016e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133870.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1276264.5000, grad_fn=<MseLossBackward>)
output :  tensor([[210308.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(53408464., grad_fn=<MseLossBackward>)
output :  tensor([[103655.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(1549499.7500, grad_fn=<MseLossBackward>)
output :  tensor([[140266.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(100142.5781, grad_fn=<MseLossBackward>)
output :  tensor([[204134.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1475e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176790.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(9670934., grad_fn=<MseLossBackward>)
output :  tensor([[185642.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(412284.3750, grad_fn=<MseLossBackward>)
output :  tensor([[162966.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1326e+10, grad_fn=<MseLossBackward>)
output :  tensor([[297429.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4115e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199128.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1509289., grad_fn=<MseLossBackward>)
output :  tensor([[260360.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0306e+10, grad_fn=<MseLossBackward>)
output :  tensor([[218676.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2395e+09, grad_fn=<MseLossBackward>)
output :  tensor([[279116.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4352e+09, grad_fn=<MseLossBackward>)
output :  tensor([[223766.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(54347.2656, grad_fn=<MseLossBackward>)
output :  tensor([[222659.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8676e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193208.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(14377842., grad_fn=<MseLossBackward>)
output :  tensor([[158623.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7757e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139680.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(51564964., grad_fn=<MseLossBackward>)
output :  tensor([[136587.]], grad_fn=<AddmmBackward>)
loss:  tensor(1181569., grad_fn=<MseLossBackward>)
output :  tensor([[90443.]], grad_fn=<AddmmBackward>)
loss:  tensor(310249., grad_fn=<MseLossBackward>)
output :  tensor([[107871.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(16570.5273, grad_fn=<MseLossBackward>)
output :  tensor([[273430.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0769e+09, grad_fn=<MseLossBackward>)
output :  tensor([[232496.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6268529.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147376.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5649683.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138851.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1825665.3750, grad_fn=<MseLossBackward>)
output :  tensor([[175956.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4944299.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147062.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3285439.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164636.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9183e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166458.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2126447.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137382.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(146258.4375, grad_fn=<MseLossBackward>)
output :  tensor([[189129.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4394e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113807.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(3265898.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175776.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(14264785., grad_fn=<MseLossBackward>)
output :  tensor([[121131.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1279974., grad_fn=<MseLossBackward>)
output :  tensor([[88163.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1354714.1250, grad_fn=<MseLossBackward>)
output :  tensor([[179109.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(793713.9375, grad_fn=<MseLossBackward>)
output :  tensor([[110798.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(807737.5000, grad_fn=<MseLossBackward>)
output :  tensor([[234319.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(21903862., grad_fn=<MseLossBackward>)
output :  tensor([[244102.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(805983.1250, grad_fn=<MseLossBackward>)
output :  tensor([[125778.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(13849911., grad_fn=<MseLossBackward>)
output :  tensor([[110702.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3040827.5000, grad_fn=<MseLossBackward>)
output :  tensor([[287189.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2489e+10, grad_fn=<MseLossBackward>)
output :  tensor([[173533.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4133152.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127245.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(5040796.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144751.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1562e+08, grad_fn=<MseLossBackward>)
output :  tensor([[200054.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9447e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139466.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2351622.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156083.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5355e+10, grad_fn=<MseLossBackward>)
output :  tensor([[148023.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(34532700., grad_fn=<MseLossBackward>)
output :  tensor([[131094.]], grad_fn=<AddmmBackward>)
loss:  tensor(2540836., grad_fn=<MseLossBackward>)
output :  tensor([[244379.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7988e+10, grad_fn=<MseLossBackward>)
output :  tensor([[390355.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3558e+08, grad_fn=<MseLossBackward>)
output :  tensor([[110666.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(2776935.7500, grad_fn=<MseLossBackward>)
output :  tensor([[113488.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(25111060., grad_fn=<MseLossBackward>)
output :  tensor([[160374.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(764395., grad_fn=<MseLossBackward>)
output :  tensor([[132198.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7531e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161877.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6147e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171813.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8210e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105607.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(4029774., grad_fn=<MseLossBackward>)
output :  tensor([[139171.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3343526.5000, grad_fn=<MseLossBackward>)
output :  tensor([[363346.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(15583990., grad_fn=<MseLossBackward>)
output :  tensor([[202069.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6968e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178181.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7191196.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200544.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5547497., grad_fn=<MseLossBackward>)
output :  tensor([[140616.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2613476.5000, grad_fn=<MseLossBackward>)
output :  tensor([[197319.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7948347., grad_fn=<MseLossBackward>)
output :  tensor([[136245.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2631e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179871.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1272560.2500, grad_fn=<MseLossBackward>)
output :  tensor([[244458.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6042532., grad_fn=<MseLossBackward>)
output :  tensor([[174484.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(234558.5938, grad_fn=<MseLossBackward>)
output :  tensor([[109020.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1041197., grad_fn=<MseLossBackward>)
output :  tensor([[265432.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(758749.8750, grad_fn=<MseLossBackward>)
output :  tensor([[251624.]], grad_fn=<AddmmBackward>)
loss:  tensor(2637376., grad_fn=<MseLossBackward>)
output :  tensor([[120172.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7994756., grad_fn=<MseLossBackward>)
output :  tensor([[213433.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7904e+09, grad_fn=<MseLossBackward>)
output :  tensor([[302302.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2888e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207078.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6137.7432, grad_fn=<MseLossBackward>)
output :  tensor([[213692.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5954e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159218.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1739307.6250, grad_fn=<MseLossBackward>)
output :  tensor([[167676.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5352210., grad_fn=<MseLossBackward>)
output :  tensor([[160190.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(10616600., grad_fn=<MseLossBackward>)
output :  tensor([[172441.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5962219.5000, grad_fn=<MseLossBackward>)
output :  tensor([[234207.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1420e+09, grad_fn=<MseLossBackward>)
output :  tensor([[214165.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3379e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160893.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9302e+08, grad_fn=<MseLossBackward>)
output :  tensor([[120221.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(7717588., grad_fn=<MseLossBackward>)
output :  tensor([[175472.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2332301.7500, grad_fn=<MseLossBackward>)
output :  tensor([[179332.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5073e+09, grad_fn=<MseLossBackward>)
output :  tensor([[204620.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6099e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133907.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(275346.1562, grad_fn=<MseLossBackward>)
output :  tensor([[151307.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8252e+08, grad_fn=<MseLossBackward>)
output :  tensor([[276430.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(324081.1562, grad_fn=<MseLossBackward>)
output :  tensor([[84760.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(57150.8789, grad_fn=<MseLossBackward>)
output :  tensor([[234887.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2600257., grad_fn=<MseLossBackward>)
output :  tensor([[256686.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0644e+11, grad_fn=<MseLossBackward>)
output :  tensor([[170600.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(360356.3438, grad_fn=<MseLossBackward>)
output :  tensor([[192315.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8219e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151922.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(9468025., grad_fn=<MseLossBackward>)
output :  tensor([[204816.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2490e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128554.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(198762.7188, grad_fn=<MseLossBackward>)
output :  tensor([[147184.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4771426., grad_fn=<MseLossBackward>)
output :  tensor([[169814.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4611e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186601.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(565151.5625, grad_fn=<MseLossBackward>)
output :  tensor([[127933.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(3740265.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138289.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3200744.7500, grad_fn=<MseLossBackward>)
output :  tensor([[168340.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(21708464., grad_fn=<MseLossBackward>)
output :  tensor([[200100.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4900e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239055.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(15556615., grad_fn=<MseLossBackward>)
output :  tensor([[153459.]], grad_fn=<AddmmBackward>)
loss:  tensor(2374681., grad_fn=<MseLossBackward>)
output :  tensor([[196236.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(55932.2500, grad_fn=<MseLossBackward>)
output :  tensor([[162200.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3126e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187167.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(58797264., grad_fn=<MseLossBackward>)
output :  tensor([[177634.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5131499., grad_fn=<MseLossBackward>)
output :  tensor([[96932.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4562.5801, grad_fn=<MseLossBackward>)
output :  tensor([[171310.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1813e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133688.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1720196.2500, grad_fn=<MseLossBackward>)
output :  tensor([[121641.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(44115128., grad_fn=<MseLossBackward>)
output :  tensor([[172430.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2461957.2500, grad_fn=<MseLossBackward>)
output :  tensor([[85614.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(377255.0625, grad_fn=<MseLossBackward>)
output :  tensor([[288535.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2146133.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168428.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(11753005., grad_fn=<MseLossBackward>)
output :  tensor([[190844.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0256e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243069.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8013e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149782.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1482991.1250, grad_fn=<MseLossBackward>)
output :  tensor([[123743.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(66032.9375, grad_fn=<MseLossBackward>)
output :  tensor([[116455.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(11866948., grad_fn=<MseLossBackward>)
output :  tensor([[144646.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7889e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172627.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1883284.5000, grad_fn=<MseLossBackward>)
output :  tensor([[113416.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5584e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208001.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2100e+10, grad_fn=<MseLossBackward>)
output :  tensor([[237381.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(16960240., grad_fn=<MseLossBackward>)
output :  tensor([[248768.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1440e+10, grad_fn=<MseLossBackward>)
output :  tensor([[220991.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2430e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194587.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4620e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187954.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(206186.9375, grad_fn=<MseLossBackward>)
output :  tensor([[206132.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7846e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188509.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1754e+10, grad_fn=<MseLossBackward>)
output :  tensor([[176564.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4734432., grad_fn=<MseLossBackward>)
output :  tensor([[150911.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1184866.2500, grad_fn=<MseLossBackward>)
output :  tensor([[334715.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5218369., grad_fn=<MseLossBackward>)
output :  tensor([[207623.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(19155394., grad_fn=<MseLossBackward>)
output :  tensor([[159909.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(8261.1055, grad_fn=<MseLossBackward>)
output :  tensor([[185397.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1475e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105528.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(279626.1250, grad_fn=<MseLossBackward>)
output :  tensor([[273282.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9365e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170937.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8778165., grad_fn=<MseLossBackward>)
output :  tensor([[211501.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3993252.7500, grad_fn=<MseLossBackward>)
output :  tensor([[205545.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3884e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178975.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(50540.6602, grad_fn=<MseLossBackward>)
output :  tensor([[198064.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(13950692., grad_fn=<MseLossBackward>)
output :  tensor([[157267.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5141343.5000, grad_fn=<MseLossBackward>)
output :  tensor([[148882.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3895e+09, grad_fn=<MseLossBackward>)
output :  tensor([[121767.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(10679620., grad_fn=<MseLossBackward>)
output :  tensor([[139888.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(12460.1406, grad_fn=<MseLossBackward>)
output :  tensor([[149374.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(140460.9844, grad_fn=<MseLossBackward>)
output :  tensor([[199525.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6506e+10, grad_fn=<MseLossBackward>)
output :  tensor([[162014.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6320589., grad_fn=<MseLossBackward>)
output :  tensor([[101503.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(4013668., grad_fn=<MseLossBackward>)
output :  tensor([[223779.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6312e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186636.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4674e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177730.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1550958.8750, grad_fn=<MseLossBackward>)
output :  tensor([[82892.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(795942.7500, grad_fn=<MseLossBackward>)
output :  tensor([[131940.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(11834353., grad_fn=<MseLossBackward>)
output :  tensor([[215554.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2416178.7500, grad_fn=<MseLossBackward>)
output :  tensor([[144342.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(117028.1328, grad_fn=<MseLossBackward>)
output :  tensor([[131508.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2276609.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140265.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5449817.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179803.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7896e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146757.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7606478., grad_fn=<MseLossBackward>)
output :  tensor([[160030.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(938.8479, grad_fn=<MseLossBackward>)
output :  tensor([[214876.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(15190.5625, grad_fn=<MseLossBackward>)
output :  tensor([[138162.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0997e+09, grad_fn=<MseLossBackward>)
output :  tensor([[254579.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(176728.2812, grad_fn=<MseLossBackward>)
output :  tensor([[161845.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5499758., grad_fn=<MseLossBackward>)
output :  tensor([[130118.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2619390.5000, grad_fn=<MseLossBackward>)
output :  tensor([[93637.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1856810.7500, grad_fn=<MseLossBackward>)
output :  tensor([[157780.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3700e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179720.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(32203.4238, grad_fn=<MseLossBackward>)
output :  tensor([[119709.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(625112.6250, grad_fn=<MseLossBackward>)
output :  tensor([[187283.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7361e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144219.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1886e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151796.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3595586.2500, grad_fn=<MseLossBackward>)
output :  tensor([[186056.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2867360.2500, grad_fn=<MseLossBackward>)
output :  tensor([[252368.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6572e+09, grad_fn=<MseLossBackward>)
output :  tensor([[94079.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6653175.5000, grad_fn=<MseLossBackward>)
output :  tensor([[239647.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(124487.6875, grad_fn=<MseLossBackward>)
output :  tensor([[126868.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(2661562.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164657.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0250e+10, grad_fn=<MseLossBackward>)
output :  tensor([[113482.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8177e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177941.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3769058.2500, grad_fn=<MseLossBackward>)
output :  tensor([[163609.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8608e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154788.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8994e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237825.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1378642.8750, grad_fn=<MseLossBackward>)
output :  tensor([[226539.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8976e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127806.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(650001.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129462.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(11991828., grad_fn=<MseLossBackward>)
output :  tensor([[224528.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6106767.5000, grad_fn=<MseLossBackward>)
output :  tensor([[230112.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(15113628., grad_fn=<MseLossBackward>)
output :  tensor([[231058.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(18996522., grad_fn=<MseLossBackward>)
output :  tensor([[147043.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(915729.3750, grad_fn=<MseLossBackward>)
output :  tensor([[214066.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(16535406., grad_fn=<MseLossBackward>)
output :  tensor([[130914.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1912e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135785.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(10796461., grad_fn=<MseLossBackward>)
output :  tensor([[308302.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(44853156., grad_fn=<MseLossBackward>)
output :  tensor([[142977.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3912360.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120827.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8974e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107741.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3092377.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155067.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0389e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178298.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2982e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171800.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1439100.1250, grad_fn=<MseLossBackward>)
output :  tensor([[191603.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(88301256., grad_fn=<MseLossBackward>)
output :  tensor([[97778.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(4934819.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178748.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(63126.5625, grad_fn=<MseLossBackward>)
output :  tensor([[168829.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(863070.0625, grad_fn=<MseLossBackward>)
output :  tensor([[142171.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(10057223., grad_fn=<MseLossBackward>)
output :  tensor([[263269.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1834e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141650.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2093e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176293.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(10849921., grad_fn=<MseLossBackward>)
output :  tensor([[138492.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2272839., grad_fn=<MseLossBackward>)
output :  tensor([[201431.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(868128.9375, grad_fn=<MseLossBackward>)
output :  tensor([[168686.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1724379.3750, grad_fn=<MseLossBackward>)
output :  tensor([[241808.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4803973.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134820.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(102420., grad_fn=<MseLossBackward>)
output :  tensor([[150589.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1536437.7500, grad_fn=<MseLossBackward>)
output :  tensor([[213355.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2704842.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164594.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(164303.5625, grad_fn=<MseLossBackward>)
output :  tensor([[187065.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3743136.7500, grad_fn=<MseLossBackward>)
output :  tensor([[133558.]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4730e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127247.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(3070462.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140558.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(312306.3438, grad_fn=<MseLossBackward>)
output :  tensor([[200041.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8245e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166173.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6187e+09, grad_fn=<MseLossBackward>)
output :  tensor([[78071.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2658e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94469.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(99386104., grad_fn=<MseLossBackward>)
output :  tensor([[256035.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7523877.5000, grad_fn=<MseLossBackward>)
output :  tensor([[203144.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1145e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113208.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3209248.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156698.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4874e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204097.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5289e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178818.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3141e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156849.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3420997., grad_fn=<MseLossBackward>)
output :  tensor([[169593.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(164861.3750, grad_fn=<MseLossBackward>)
output :  tensor([[115524.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(275051.0938, grad_fn=<MseLossBackward>)
output :  tensor([[164006.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(81114512., grad_fn=<MseLossBackward>)
output :  tensor([[192973.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9396e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219739.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(57420.1406, grad_fn=<MseLossBackward>)
output :  tensor([[243216.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5179e+11, grad_fn=<MseLossBackward>)
output :  tensor([[146938.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3730.5374, grad_fn=<MseLossBackward>)
output :  tensor([[111420.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(8647965., grad_fn=<MseLossBackward>)
output :  tensor([[167635.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0348e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155408.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(24091378., grad_fn=<MseLossBackward>)
output :  tensor([[233734.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(10662878., grad_fn=<MseLossBackward>)
output :  tensor([[117686.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7218457.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186245.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(11192161., grad_fn=<MseLossBackward>)
output :  tensor([[185745.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(911607.2500, grad_fn=<MseLossBackward>)
output :  tensor([[163768.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4408e+10, grad_fn=<MseLossBackward>)
output :  tensor([[94601.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8500e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236772.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4962243.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175080.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(846026.3125, grad_fn=<MseLossBackward>)
output :  tensor([[139678.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(103553.2266, grad_fn=<MseLossBackward>)
output :  tensor([[233874.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1266996.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159977.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(9134278., grad_fn=<MseLossBackward>)
output :  tensor([[201755.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5189e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133699.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1691300.2500, grad_fn=<MseLossBackward>)
output :  tensor([[186198.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8557e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136551.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(304083.3125, grad_fn=<MseLossBackward>)
output :  tensor([[223830.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4810e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224306.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6015e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92980.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(8883427., grad_fn=<MseLossBackward>)
output :  tensor([[160164.]], grad_fn=<AddmmBackward>)
loss:  tensor(532900., grad_fn=<MseLossBackward>)
output :  tensor([[245783.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5649e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145353.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(125006.4375, grad_fn=<MseLossBackward>)
output :  tensor([[110773.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9161e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164254.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(60224.2266, grad_fn=<MseLossBackward>)
output :  tensor([[147818.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(14578675., grad_fn=<MseLossBackward>)
output :  tensor([[128452.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(63728.6367, grad_fn=<MseLossBackward>)
output :  tensor([[189777.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7918e+09, grad_fn=<MseLossBackward>)
output :  tensor([[125322.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(7966021., grad_fn=<MseLossBackward>)
output :  tensor([[150005.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3976534.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171522.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(51578.6680, grad_fn=<MseLossBackward>)
output :  tensor([[150090.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(826678.7500, grad_fn=<MseLossBackward>)
output :  tensor([[158836.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(16508731., grad_fn=<MseLossBackward>)
output :  tensor([[135556.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0527e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132680.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(462867.6250, grad_fn=<MseLossBackward>)
output :  tensor([[154989.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5568e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145293.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1303272., grad_fn=<MseLossBackward>)
output :  tensor([[164208.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6043377., grad_fn=<MseLossBackward>)
output :  tensor([[142903.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0892e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148611.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(35502.8047, grad_fn=<MseLossBackward>)
output :  tensor([[185945.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4221419.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170401.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1965472.6250, grad_fn=<MseLossBackward>)
output :  tensor([[180673.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(454212.8125, grad_fn=<MseLossBackward>)
output :  tensor([[218738.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1590475.6250, grad_fn=<MseLossBackward>)
output :  tensor([[110252.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5532859.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139671.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1820e+08, grad_fn=<MseLossBackward>)
output :  tensor([[291225.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(27302584., grad_fn=<MseLossBackward>)
output :  tensor([[116885.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(783390.9375, grad_fn=<MseLossBackward>)
output :  tensor([[177878.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7742e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190376.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(28911792., grad_fn=<MseLossBackward>)
output :  tensor([[172719.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6334e+08, grad_fn=<MseLossBackward>)
output :  tensor([[251695.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4309e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219831.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4703544.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133694.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7253e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175620.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1168e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127528.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(12447335., grad_fn=<MseLossBackward>)
output :  tensor([[184893.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4459e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151406.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2539043., grad_fn=<MseLossBackward>)
output :  tensor([[156219.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(94476880., grad_fn=<MseLossBackward>)
output :  tensor([[204910.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1930145.7500, grad_fn=<MseLossBackward>)
output :  tensor([[146105.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8510e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173780.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4925764., grad_fn=<MseLossBackward>)
output :  tensor([[249323.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1063e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145863.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4564498.5000, grad_fn=<MseLossBackward>)
output :  tensor([[203757.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1193317.2500, grad_fn=<MseLossBackward>)
output :  tensor([[160191.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(58435.5078, grad_fn=<MseLossBackward>)
output :  tensor([[126926.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5153e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138159.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5806518.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183792.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(43075.7070, grad_fn=<MseLossBackward>)
output :  tensor([[196609.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(43679500., grad_fn=<MseLossBackward>)
output :  tensor([[218876.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9173e+09, grad_fn=<MseLossBackward>)
output :  tensor([[257675.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(456616.9375, grad_fn=<MseLossBackward>)
output :  tensor([[182513.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8628e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144642.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8242e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143097.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1967313., grad_fn=<MseLossBackward>)
output :  tensor([[73165.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1000e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133219.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3168956.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129157.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(66330.3906, grad_fn=<MseLossBackward>)
output :  tensor([[155466.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2150439., grad_fn=<MseLossBackward>)
output :  tensor([[130613.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(13059133., grad_fn=<MseLossBackward>)
output :  tensor([[74990.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(2278095., grad_fn=<MseLossBackward>)
output :  tensor([[84111.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4456651., grad_fn=<MseLossBackward>)
output :  tensor([[224809.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(51709584., grad_fn=<MseLossBackward>)
output :  tensor([[141368.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3340e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130009.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(240475.2969, grad_fn=<MseLossBackward>)
output :  tensor([[170281.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(10766807., grad_fn=<MseLossBackward>)
output :  tensor([[236186.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1407708.1250, grad_fn=<MseLossBackward>)
output :  tensor([[191346.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(629270.3750, grad_fn=<MseLossBackward>)
output :  tensor([[156716.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(512700.7500, grad_fn=<MseLossBackward>)
output :  tensor([[197950.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2583.4983, grad_fn=<MseLossBackward>)
output :  tensor([[200600.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3249e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138775.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3153898.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153445.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2415838.7500, grad_fn=<MseLossBackward>)
output :  tensor([[136130.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(17099.6484, grad_fn=<MseLossBackward>)
output :  tensor([[194963.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2276e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155711.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2930409., grad_fn=<MseLossBackward>)
output :  tensor([[138837.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0555e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143625.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1624111.2500, grad_fn=<MseLossBackward>)
output :  tensor([[212060.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3688.6643, grad_fn=<MseLossBackward>)
output :  tensor([[104184.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9213e+08, grad_fn=<MseLossBackward>)
output :  tensor([[170167.]], grad_fn=<AddmmBackward>)
loss:  tensor(7112889., grad_fn=<MseLossBackward>)
output :  tensor([[128443.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(196851.6719, grad_fn=<MseLossBackward>)
output :  tensor([[146865.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(18048.2422, grad_fn=<MseLossBackward>)
output :  tensor([[106067.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9083e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138061.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(315773.7500, grad_fn=<MseLossBackward>)
output :  tensor([[233521.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6143891.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145408.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(167204.3281, grad_fn=<MseLossBackward>)
output :  tensor([[139872.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5627718.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165200.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3839e+09, grad_fn=<MseLossBackward>)
output :  tensor([[265135.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6549e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176145.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1312062.8750, grad_fn=<MseLossBackward>)
output :  tensor([[104715.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3760084.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200919.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8646e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163938.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(24387548., grad_fn=<MseLossBackward>)
output :  tensor([[163720.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5670e+10, grad_fn=<MseLossBackward>)
output :  tensor([[98807.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(258048.1250, grad_fn=<MseLossBackward>)
output :  tensor([[124411.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(658189.9375, grad_fn=<MseLossBackward>)
output :  tensor([[152876.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(9753715., grad_fn=<MseLossBackward>)
output :  tensor([[141319.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1740461.7500, grad_fn=<MseLossBackward>)
output :  tensor([[203642.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(13267009., grad_fn=<MseLossBackward>)
output :  tensor([[146396.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(19329212., grad_fn=<MseLossBackward>)
output :  tensor([[262529.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(62156.7227, grad_fn=<MseLossBackward>)
output :  tensor([[128777.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2800e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164113.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1923118.8750, grad_fn=<MseLossBackward>)
output :  tensor([[188129.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(137270.2500, grad_fn=<MseLossBackward>)
output :  tensor([[122749.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6254e+08, grad_fn=<MseLossBackward>)
output :  tensor([[248965.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1069414.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157429.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7440e+08, grad_fn=<MseLossBackward>)
output :  tensor([[241878.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(12053808., grad_fn=<MseLossBackward>)
output :  tensor([[145822.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3322189.7500, grad_fn=<MseLossBackward>)
output :  tensor([[209498.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(251141.9219, grad_fn=<MseLossBackward>)
output :  tensor([[171481.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(843010.8750, grad_fn=<MseLossBackward>)
output :  tensor([[153011.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(976638.0625, grad_fn=<MseLossBackward>)
output :  tensor([[119601.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(2565277.7500, grad_fn=<MseLossBackward>)
output :  tensor([[238812.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3307e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239995.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(24.8440, grad_fn=<MseLossBackward>)
output :  tensor([[152410.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(857910.1250, grad_fn=<MseLossBackward>)
output :  tensor([[255532.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(400313.2500, grad_fn=<MseLossBackward>)
output :  tensor([[121609.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(50488240., grad_fn=<MseLossBackward>)
output :  tensor([[178022.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4092276.2500, grad_fn=<MseLossBackward>)
output :  tensor([[162313.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5354162., grad_fn=<MseLossBackward>)
output :  tensor([[133764.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(7641078., grad_fn=<MseLossBackward>)
output :  tensor([[196019.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4248e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166574.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6627165.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158976.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(16191570., grad_fn=<MseLossBackward>)
output :  tensor([[156273.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2981935.2500, grad_fn=<MseLossBackward>)
output :  tensor([[152209.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5335811.5000, grad_fn=<MseLossBackward>)
output :  tensor([[173857.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1420e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162407.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(5796056., grad_fn=<MseLossBackward>)
output :  tensor([[373648.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0652e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135649.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(74811960., grad_fn=<MseLossBackward>)
output :  tensor([[129482.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9344e+09, grad_fn=<MseLossBackward>)
output :  tensor([[278314.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(8402570., grad_fn=<MseLossBackward>)
output :  tensor([[161955.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1983.0322, grad_fn=<MseLossBackward>)
output :  tensor([[132806.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5145e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236712.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(22208246., grad_fn=<MseLossBackward>)
output :  tensor([[181695.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1429593.8750, grad_fn=<MseLossBackward>)
output :  tensor([[151908.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8360.8164, grad_fn=<MseLossBackward>)
output :  tensor([[146007.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1015087.7500, grad_fn=<MseLossBackward>)
output :  tensor([[155367.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4103e+08, grad_fn=<MseLossBackward>)
output :  tensor([[100920.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(847392.1875, grad_fn=<MseLossBackward>)
output :  tensor([[77677.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1250e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165202.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(40854.5156, grad_fn=<MseLossBackward>)
output :  tensor([[187076.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6747e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157808.]], grad_fn=<AddmmBackward>)
loss:  tensor(36864., grad_fn=<MseLossBackward>)
output :  tensor([[164160.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(44356224., grad_fn=<MseLossBackward>)
output :  tensor([[141123.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(13496439., grad_fn=<MseLossBackward>)
output :  tensor([[203863.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4351657., grad_fn=<MseLossBackward>)
output :  tensor([[138383.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(146808.7188, grad_fn=<MseLossBackward>)
output :  tensor([[182223.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6327e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144483.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2299156.2500, grad_fn=<MseLossBackward>)
output :  tensor([[110385.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4998e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94855.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(731185.3125, grad_fn=<MseLossBackward>)
output :  tensor([[174988.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(127.6194, grad_fn=<MseLossBackward>)
output :  tensor([[263199.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(7835800.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140731.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(590616.2500, grad_fn=<MseLossBackward>)
output :  tensor([[159631.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(69671.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134630.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4539696., grad_fn=<MseLossBackward>)
output :  tensor([[151792.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5257562.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171927.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(16224532., grad_fn=<MseLossBackward>)
output :  tensor([[126643.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(127136.8125, grad_fn=<MseLossBackward>)
output :  tensor([[172726.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6876e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156557.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(195626.5312, grad_fn=<MseLossBackward>)
output :  tensor([[116425.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5506.1035, grad_fn=<MseLossBackward>)
output :  tensor([[160465.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2613e+09, grad_fn=<MseLossBackward>)
output :  tensor([[55602.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(12975924., grad_fn=<MseLossBackward>)
output :  tensor([[233645.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2181e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197765.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(10463709., grad_fn=<MseLossBackward>)
output :  tensor([[183540.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2129228.2500, grad_fn=<MseLossBackward>)
output :  tensor([[106626.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(392835.1562, grad_fn=<MseLossBackward>)
output :  tensor([[89288.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(5235766.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141235.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1526691.8750, grad_fn=<MseLossBackward>)
output :  tensor([[219066.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6150e+09, grad_fn=<MseLossBackward>)
output :  tensor([[202007.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(30164982., grad_fn=<MseLossBackward>)
output :  tensor([[166393.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1941450.3750, grad_fn=<MseLossBackward>)
output :  tensor([[171351.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7700e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189183.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(666136.5000, grad_fn=<MseLossBackward>)
output :  tensor([[87668.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(446693.8125, grad_fn=<MseLossBackward>)
output :  tensor([[138008.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3964516.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110948.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(200949.0781, grad_fn=<MseLossBackward>)
output :  tensor([[149904.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9446e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173789.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8309e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193741.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2675e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178102.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3601395.7500, grad_fn=<MseLossBackward>)
output :  tensor([[98409.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3647145., grad_fn=<MseLossBackward>)
output :  tensor([[116742.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(573960.1250, grad_fn=<MseLossBackward>)
output :  tensor([[162315.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7020e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202121.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4499370., grad_fn=<MseLossBackward>)
output :  tensor([[145403.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1970557.8750, grad_fn=<MseLossBackward>)
train_loss: [2.6368858e+09]
epoch_result tensor([0.])
output :  tensor([[153514.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(24856768., grad_fn=<MseLossBackward>)
output :  tensor([[124749.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(7562285., grad_fn=<MseLossBackward>)
output :  tensor([[195347.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1315465.6250, grad_fn=<MseLossBackward>)
output :  tensor([[177161.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(26178.2285, grad_fn=<MseLossBackward>)
output :  tensor([[153556.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9747e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124770.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(10429014., grad_fn=<MseLossBackward>)
output :  tensor([[139781.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1483790.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117984.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(1032144.8750, grad_fn=<MseLossBackward>)
output :  tensor([[67909.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(88546920., grad_fn=<MseLossBackward>)
output :  tensor([[166107.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(11559.6094, grad_fn=<MseLossBackward>)
output :  tensor([[137816.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4769515., grad_fn=<MseLossBackward>)
output :  tensor([[225828.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(685739.2500, grad_fn=<MseLossBackward>)
output :  tensor([[166149.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8125706.5000, grad_fn=<MseLossBackward>)
output :  tensor([[250999.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1688700.2500, grad_fn=<MseLossBackward>)
output :  tensor([[54612.6133]], grad_fn=<AddmmBackward>)
loss:  tensor(150068.4688, grad_fn=<MseLossBackward>)
output :  tensor([[162522.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2480e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179288.]], grad_fn=<AddmmBackward>)
loss:  tensor(18386944., grad_fn=<MseLossBackward>)
output :  tensor([[144562.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4251e+08, grad_fn=<MseLossBackward>)
output :  tensor([[277478.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6145286., grad_fn=<MseLossBackward>)
output :  tensor([[193937.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(9379768., grad_fn=<MseLossBackward>)
output :  tensor([[135446.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6759e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195766.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3564249., grad_fn=<MseLossBackward>)
output :  tensor([[178741.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1306e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150134.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(749496., grad_fn=<MseLossBackward>)
output :  tensor([[175437.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(29563178., grad_fn=<MseLossBackward>)
output :  tensor([[86666.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1602953.8750, grad_fn=<MseLossBackward>)
output :  tensor([[169774.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2233e+09, grad_fn=<MseLossBackward>)
output :  tensor([[188612.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(13050608., grad_fn=<MseLossBackward>)
output :  tensor([[205613.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4887e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108906.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(1195998.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170666.]], grad_fn=<AddmmBackward>)
loss:  tensor(111556., grad_fn=<MseLossBackward>)
output :  tensor([[137686.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1408598.1250, grad_fn=<MseLossBackward>)
output :  tensor([[128393.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(367993.8750, grad_fn=<MseLossBackward>)
output :  tensor([[120796.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1681236.3750, grad_fn=<MseLossBackward>)
output :  tensor([[148433.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8806e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169592.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1143e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152087.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5700529.5000, grad_fn=<MseLossBackward>)
output :  tensor([[181736.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3015161., grad_fn=<MseLossBackward>)
output :  tensor([[144919.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(15360643., grad_fn=<MseLossBackward>)
output :  tensor([[107155.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9432e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136964.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0895e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134796.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(41278.8125, grad_fn=<MseLossBackward>)
output :  tensor([[130745.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(14026722., grad_fn=<MseLossBackward>)
output :  tensor([[222859.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4583747., grad_fn=<MseLossBackward>)
output :  tensor([[134620.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5619122., grad_fn=<MseLossBackward>)
output :  tensor([[152108.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9664327., grad_fn=<MseLossBackward>)
output :  tensor([[113439.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(2071058.2500, grad_fn=<MseLossBackward>)
output :  tensor([[157455.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6474480., grad_fn=<MseLossBackward>)
output :  tensor([[146129.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3883e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194647.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7010001., grad_fn=<MseLossBackward>)
output :  tensor([[135454.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1008361.1250, grad_fn=<MseLossBackward>)
output :  tensor([[123280.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7637e+08, grad_fn=<MseLossBackward>)
output :  tensor([[230312.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(13595928., grad_fn=<MseLossBackward>)
output :  tensor([[164441.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4057e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163044.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(16358991., grad_fn=<MseLossBackward>)
output :  tensor([[204294.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8293e+10, grad_fn=<MseLossBackward>)
output :  tensor([[245363.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1802e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142287.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1469398.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137268.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(10682173., grad_fn=<MseLossBackward>)
output :  tensor([[156385.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1920389.6250, grad_fn=<MseLossBackward>)
output :  tensor([[133444.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(11866195., grad_fn=<MseLossBackward>)
output :  tensor([[178673.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6139e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184871.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(595477.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162284.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(615611.8750, grad_fn=<MseLossBackward>)
output :  tensor([[153975.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2045e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141754.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(555583.8750, grad_fn=<MseLossBackward>)
output :  tensor([[139835.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(26669156., grad_fn=<MseLossBackward>)
output :  tensor([[173084.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4357e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193515.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5153e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136495.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(23.1602, grad_fn=<MseLossBackward>)
output :  tensor([[168678.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(10378465., grad_fn=<MseLossBackward>)
output :  tensor([[178590.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5804410.5000, grad_fn=<MseLossBackward>)
output :  tensor([[116882.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3543276.7500, grad_fn=<MseLossBackward>)
output :  tensor([[220582.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(174188.8438, grad_fn=<MseLossBackward>)
output :  tensor([[180521.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8870531., grad_fn=<MseLossBackward>)
output :  tensor([[128612.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(9684593., grad_fn=<MseLossBackward>)
output :  tensor([[193143.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(11268295., grad_fn=<MseLossBackward>)
output :  tensor([[174311.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(346461., grad_fn=<MseLossBackward>)
output :  tensor([[206755.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2218e+10, grad_fn=<MseLossBackward>)
output :  tensor([[207504.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(12219722., grad_fn=<MseLossBackward>)
output :  tensor([[165936.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2206e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195526.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1054023., grad_fn=<MseLossBackward>)
output :  tensor([[113584.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(342124.4688, grad_fn=<MseLossBackward>)
output :  tensor([[115842.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(11171627., grad_fn=<MseLossBackward>)
output :  tensor([[111420.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(336390.9375, grad_fn=<MseLossBackward>)
output :  tensor([[148696.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3598312.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159914.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3390e+10, grad_fn=<MseLossBackward>)
output :  tensor([[182830.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8012172.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128545.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(1092825.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145785.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(617231.1875, grad_fn=<MseLossBackward>)
output :  tensor([[184834.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4935e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116674.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(50991.2852, grad_fn=<MseLossBackward>)
output :  tensor([[192451.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(20690274., grad_fn=<MseLossBackward>)
output :  tensor([[142757.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(5030278., grad_fn=<MseLossBackward>)
output :  tensor([[208539.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(19011644., grad_fn=<MseLossBackward>)
output :  tensor([[126104.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(10835.5088, grad_fn=<MseLossBackward>)
output :  tensor([[248554.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(51266.8672, grad_fn=<MseLossBackward>)
output :  tensor([[235071.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4929e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149293.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2017e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85437.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9718e+08, grad_fn=<MseLossBackward>)
output :  tensor([[191457.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9626e+09, grad_fn=<MseLossBackward>)
output :  tensor([[80228.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(594850.6875, grad_fn=<MseLossBackward>)
output :  tensor([[138967.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(283939.1250, grad_fn=<MseLossBackward>)
output :  tensor([[76779.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1637880., grad_fn=<MseLossBackward>)
output :  tensor([[140331.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(6871443., grad_fn=<MseLossBackward>)
output :  tensor([[177160.]], grad_fn=<AddmmBackward>)
loss:  tensor(1345600., grad_fn=<MseLossBackward>)
output :  tensor([[153305.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(37696.6484, grad_fn=<MseLossBackward>)
output :  tensor([[106742.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(432912.5938, grad_fn=<MseLossBackward>)
output :  tensor([[204360.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2408e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132333.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(14695243., grad_fn=<MseLossBackward>)
output :  tensor([[267823.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4828e+08, grad_fn=<MseLossBackward>)
output :  tensor([[300988.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(81211072., grad_fn=<MseLossBackward>)
output :  tensor([[107492.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(55.2003, grad_fn=<MseLossBackward>)
output :  tensor([[172637.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(18876.1836, grad_fn=<MseLossBackward>)
output :  tensor([[134992.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2861e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139029.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(847.3557, grad_fn=<MseLossBackward>)
output :  tensor([[129894.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(126097.1172, grad_fn=<MseLossBackward>)
output :  tensor([[127175.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4734704., grad_fn=<MseLossBackward>)
output :  tensor([[135736.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8834e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227250.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8318e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189548.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2937e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144003.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(10679.9307, grad_fn=<MseLossBackward>)
output :  tensor([[125726.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(3144221.5000, grad_fn=<MseLossBackward>)
output :  tensor([[111380.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(16985.4199, grad_fn=<MseLossBackward>)
output :  tensor([[254016.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1017e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134546.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(205676.4219, grad_fn=<MseLossBackward>)
output :  tensor([[201020.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3919657.5000, grad_fn=<MseLossBackward>)
output :  tensor([[107076.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4738240.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138511.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2068742.8750, grad_fn=<MseLossBackward>)
output :  tensor([[207290.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9617e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179831.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4687.9697, grad_fn=<MseLossBackward>)
output :  tensor([[187205.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4865677.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164358.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0921e+10, grad_fn=<MseLossBackward>)
output :  tensor([[292804.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7804e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195600.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5289712.5000, grad_fn=<MseLossBackward>)
output :  tensor([[260180.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0358e+10, grad_fn=<MseLossBackward>)
output :  tensor([[220969.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0278e+09, grad_fn=<MseLossBackward>)
output :  tensor([[280749.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3141e+09, grad_fn=<MseLossBackward>)
output :  tensor([[226348.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5513617.5000, grad_fn=<MseLossBackward>)
output :  tensor([[222952.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8577e+10, grad_fn=<MseLossBackward>)
output :  tensor([[198639.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2687089.2500, grad_fn=<MseLossBackward>)
output :  tensor([[159575.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3489e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132132.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(134872.5625, grad_fn=<MseLossBackward>)
output :  tensor([[134103.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1951434.3750, grad_fn=<MseLossBackward>)
output :  tensor([[91034.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(1177.8838, grad_fn=<MseLossBackward>)
output :  tensor([[105903.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4395509., grad_fn=<MseLossBackward>)
output :  tensor([[271165.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3333e+09, grad_fn=<MseLossBackward>)
output :  tensor([[234097.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(814647.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144379.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(384806.9688, grad_fn=<MseLossBackward>)
output :  tensor([[133972.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(12440060., grad_fn=<MseLossBackward>)
output :  tensor([[176648.]], grad_fn=<AddmmBackward>)
loss:  tensor(8497225., grad_fn=<MseLossBackward>)
output :  tensor([[146264.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1029368.7500, grad_fn=<MseLossBackward>)
output :  tensor([[165071.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6605e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164945.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2944.7581, grad_fn=<MseLossBackward>)
output :  tensor([[138051.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1105290.8750, grad_fn=<MseLossBackward>)
output :  tensor([[188379.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3402e+09, grad_fn=<MseLossBackward>)
output :  tensor([[112721.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(520460.7812, grad_fn=<MseLossBackward>)
output :  tensor([[166361.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(31794092., grad_fn=<MseLossBackward>)
output :  tensor([[123656.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(13372678., grad_fn=<MseLossBackward>)
output :  tensor([[87851.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(725557.9375, grad_fn=<MseLossBackward>)
output :  tensor([[179154.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(714711.7500, grad_fn=<MseLossBackward>)
output :  tensor([[110413.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(263666.2188, grad_fn=<MseLossBackward>)
output :  tensor([[234027.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(24729796., grad_fn=<MseLossBackward>)
output :  tensor([[244709.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(84235.9922, grad_fn=<MseLossBackward>)
output :  tensor([[131859.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5567682.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110007.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(1098942.7500, grad_fn=<MseLossBackward>)
output :  tensor([[287462.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2407e+10, grad_fn=<MseLossBackward>)
output :  tensor([[176484.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(24842436., grad_fn=<MseLossBackward>)
output :  tensor([[125775.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(601545.6875, grad_fn=<MseLossBackward>)
output :  tensor([[146479.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1107e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202183.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3963e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141501.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(251753.0625, grad_fn=<MseLossBackward>)
output :  tensor([[158953.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4652e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153939.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1552.8525, grad_fn=<MseLossBackward>)
output :  tensor([[128206.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1673465.6250, grad_fn=<MseLossBackward>)
output :  tensor([[244301.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8009e+10, grad_fn=<MseLossBackward>)
output :  tensor([[397649.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(18925490., grad_fn=<MseLossBackward>)
output :  tensor([[111030.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(4124548.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121854.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(11253404., grad_fn=<MseLossBackward>)
output :  tensor([[159452.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2280.0625, grad_fn=<MseLossBackward>)
output :  tensor([[131191.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2023e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163248.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4517e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173029.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9727e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105348.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3056651.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142077.]], grad_fn=<AddmmBackward>)
loss:  tensor(1159929., grad_fn=<MseLossBackward>)
output :  tensor([[369899.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6788956., grad_fn=<MseLossBackward>)
output :  tensor([[201376.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7693e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175430.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4878.1494, grad_fn=<MseLossBackward>)
output :  tensor([[208247.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(28600602., grad_fn=<MseLossBackward>)
output :  tensor([[140042.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1086350.2500, grad_fn=<MseLossBackward>)
output :  tensor([[196259.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3094191., grad_fn=<MseLossBackward>)
output :  tensor([[136385.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3437e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177889.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(9674627., grad_fn=<MseLossBackward>)
output :  tensor([[240274.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2978536.7500, grad_fn=<MseLossBackward>)
output :  tensor([[168803.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(27007022., grad_fn=<MseLossBackward>)
output :  tensor([[109811.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3280400.2500, grad_fn=<MseLossBackward>)
output :  tensor([[264546.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(216.6416, grad_fn=<MseLossBackward>)
output :  tensor([[252216.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4912387.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120358.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6977357., grad_fn=<MseLossBackward>)
output :  tensor([[213418.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7923e+09, grad_fn=<MseLossBackward>)
output :  tensor([[301426.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6994e+08, grad_fn=<MseLossBackward>)
output :  tensor([[205795.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1451761.3750, grad_fn=<MseLossBackward>)
output :  tensor([[215421.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5520e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161280.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(11429682., grad_fn=<MseLossBackward>)
output :  tensor([[170803.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(661528.0625, grad_fn=<MseLossBackward>)
output :  tensor([[163276.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(40248120., grad_fn=<MseLossBackward>)
output :  tensor([[169987.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(155.8596, grad_fn=<MseLossBackward>)
output :  tensor([[235186.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0767e+09, grad_fn=<MseLossBackward>)
output :  tensor([[215916.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8332e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163245.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6392e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123306.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(93765.1406, grad_fn=<MseLossBackward>)
output :  tensor([[176755.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(59642.7969, grad_fn=<MseLossBackward>)
output :  tensor([[183637.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8312e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205435.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5790e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134343.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7901.5430, grad_fn=<MseLossBackward>)
output :  tensor([[152589.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6033e+08, grad_fn=<MseLossBackward>)
output :  tensor([[283429.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(41335656., grad_fn=<MseLossBackward>)
output :  tensor([[88226.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(10412420., grad_fn=<MseLossBackward>)
output :  tensor([[236096.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(163190.7500, grad_fn=<MseLossBackward>)
output :  tensor([[259350.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0471e+11, grad_fn=<MseLossBackward>)
output :  tensor([[170572.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(327702.5938, grad_fn=<MseLossBackward>)
output :  tensor([[193722.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7039e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153873.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1269319.1250, grad_fn=<MseLossBackward>)
output :  tensor([[207349.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9251e+09, grad_fn=<MseLossBackward>)
output :  tensor([[132490.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(12183590., grad_fn=<MseLossBackward>)
output :  tensor([[143250.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3062281.2500, grad_fn=<MseLossBackward>)
output :  tensor([[171043.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1476e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184719.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1277253.1250, grad_fn=<MseLossBackward>)
output :  tensor([[128625.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(6892963., grad_fn=<MseLossBackward>)
output :  tensor([[138825.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5410058., grad_fn=<MseLossBackward>)
output :  tensor([[179838.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(46768500., grad_fn=<MseLossBackward>)
output :  tensor([[198577.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6443e+09, grad_fn=<MseLossBackward>)
output :  tensor([[243108.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(11860.5713, grad_fn=<MseLossBackward>)
output :  tensor([[153865.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1286771.2500, grad_fn=<MseLossBackward>)
output :  tensor([[194945.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1111443., grad_fn=<MseLossBackward>)
output :  tensor([[163973.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9895e+08, grad_fn=<MseLossBackward>)
output :  tensor([[190449.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1990e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184325.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(19581592., grad_fn=<MseLossBackward>)
output :  tensor([[102685.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(32328198., grad_fn=<MseLossBackward>)
output :  tensor([[174983.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1029e+10, grad_fn=<MseLossBackward>)
output :  tensor([[137256.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5092709., grad_fn=<MseLossBackward>)
output :  tensor([[122601.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(57790284., grad_fn=<MseLossBackward>)
output :  tensor([[175395.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1947943.6250, grad_fn=<MseLossBackward>)
output :  tensor([[85635.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(403661.6875, grad_fn=<MseLossBackward>)
output :  tensor([[290350.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(122828.3438, grad_fn=<MseLossBackward>)
output :  tensor([[165481.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(231917.4844, grad_fn=<MseLossBackward>)
output :  tensor([[188754.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0855e+10, grad_fn=<MseLossBackward>)
output :  tensor([[244438.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0551e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152385.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1918311.6250, grad_fn=<MseLossBackward>)
output :  tensor([[123749.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(62969.6289, grad_fn=<MseLossBackward>)
output :  tensor([[121614.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2941010.7500, grad_fn=<MseLossBackward>)
output :  tensor([[145091.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0549e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177108.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(9660150., grad_fn=<MseLossBackward>)
output :  tensor([[113361.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5242e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207759.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2153e+10, grad_fn=<MseLossBackward>)
output :  tensor([[236055.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(29638838., grad_fn=<MseLossBackward>)
output :  tensor([[249519.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1220e+10, grad_fn=<MseLossBackward>)
output :  tensor([[223043.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5461e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195829.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4321e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188242.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(550842.3125, grad_fn=<MseLossBackward>)
output :  tensor([[205772.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8004e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189337.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1510e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178977.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(56250.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151755.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(59566.5039, grad_fn=<MseLossBackward>)
output :  tensor([[334679.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5383270., grad_fn=<MseLossBackward>)
output :  tensor([[211688.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(97051.7188, grad_fn=<MseLossBackward>)
output :  tensor([[163562.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(12693633., grad_fn=<MseLossBackward>)
output :  tensor([[185708.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1127e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106868.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3490650., grad_fn=<MseLossBackward>)
output :  tensor([[269241.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1658e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174349.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(201615.0312, grad_fn=<MseLossBackward>)
output :  tensor([[217112.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(13046657., grad_fn=<MseLossBackward>)
output :  tensor([[207256.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8888e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179006.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(37345.5625, grad_fn=<MseLossBackward>)
output :  tensor([[200370.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2044274.3750, grad_fn=<MseLossBackward>)
output :  tensor([[154177.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(677200.4375, grad_fn=<MseLossBackward>)
output :  tensor([[149454.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4457e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120340.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(3387986.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138962.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1075790.3750, grad_fn=<MseLossBackward>)
output :  tensor([[146283.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7380221., grad_fn=<MseLossBackward>)
output :  tensor([[201309.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6051e+10, grad_fn=<MseLossBackward>)
output :  tensor([[162079.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6655271.5000, grad_fn=<MseLossBackward>)
output :  tensor([[101744.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5036518., grad_fn=<MseLossBackward>)
output :  tensor([[223510.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7191e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187357.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7777e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176011.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(223950.7812, grad_fn=<MseLossBackward>)
output :  tensor([[82302.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(91222.8750, grad_fn=<MseLossBackward>)
output :  tensor([[129153.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(427685.3438, grad_fn=<MseLossBackward>)
output :  tensor([[211327.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7140836.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144464.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(215978.0469, grad_fn=<MseLossBackward>)
output :  tensor([[133458.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(11959493., grad_fn=<MseLossBackward>)
output :  tensor([[142274.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(105828.2188, grad_fn=<MseLossBackward>)
output :  tensor([[179910.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7987e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144407.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(165712.5938, grad_fn=<MseLossBackward>)
output :  tensor([[158859.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1301274.8750, grad_fn=<MseLossBackward>)
output :  tensor([[216227.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1506104.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138352.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1124e+09, grad_fn=<MseLossBackward>)
output :  tensor([[258000.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(9001313., grad_fn=<MseLossBackward>)
output :  tensor([[160792.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1670960.1250, grad_fn=<MseLossBackward>)
output :  tensor([[127244.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(1577241.6250, grad_fn=<MseLossBackward>)
output :  tensor([[97641.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6978843., grad_fn=<MseLossBackward>)
output :  tensor([[155883.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0956e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180189.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(83774.0625, grad_fn=<MseLossBackward>)
output :  tensor([[121035.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(287028.0625, grad_fn=<MseLossBackward>)
output :  tensor([[185602.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8790e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146322.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4653e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151131.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1515861.1250, grad_fn=<MseLossBackward>)
output :  tensor([[188254.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(254299.5781, grad_fn=<MseLossBackward>)
output :  tensor([[251770.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7062e+09, grad_fn=<MseLossBackward>)
output :  tensor([[92613.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1239743.1250, grad_fn=<MseLossBackward>)
output :  tensor([[236426.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(12773253., grad_fn=<MseLossBackward>)
output :  tensor([[128966.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(217345.3594, grad_fn=<MseLossBackward>)
output :  tensor([[166875.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8059e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113639.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8604e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175341.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(433807.4688, grad_fn=<MseLossBackward>)
output :  tensor([[163317.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7206e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155009.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0071e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237541.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2126538.7500, grad_fn=<MseLossBackward>)
output :  tensor([[225274.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0709e+09, grad_fn=<MseLossBackward>)
output :  tensor([[126385.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(377600.6562, grad_fn=<MseLossBackward>)
output :  tensor([[125184.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(664696.2500, grad_fn=<MseLossBackward>)
output :  tensor([[222643.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(18979364., grad_fn=<MseLossBackward>)
output :  tensor([[228690.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(28194606., grad_fn=<MseLossBackward>)
output :  tensor([[223127.]], grad_fn=<AddmmBackward>)
loss:  tensor(12766329., grad_fn=<MseLossBackward>)
output :  tensor([[147696.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(91846.8750, grad_fn=<MseLossBackward>)
output :  tensor([[204783.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(27213176., grad_fn=<MseLossBackward>)
output :  tensor([[128922.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(79604312., grad_fn=<MseLossBackward>)
output :  tensor([[134825.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(5408459., grad_fn=<MseLossBackward>)
output :  tensor([[309086.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(34969112., grad_fn=<MseLossBackward>)
output :  tensor([[139186.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3288952.2500, grad_fn=<MseLossBackward>)
output :  tensor([[122928.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1280e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108024.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2178530., grad_fn=<MseLossBackward>)
output :  tensor([[155931.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7452e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177364.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4791e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173809.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(655239.6875, grad_fn=<MseLossBackward>)
output :  tensor([[188950.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4518e+08, grad_fn=<MseLossBackward>)
output :  tensor([[103233.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(10456937., grad_fn=<MseLossBackward>)
output :  tensor([[181424.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5876533.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167726.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(30140.2148, grad_fn=<MseLossBackward>)
output :  tensor([[140998.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3995251.5000, grad_fn=<MseLossBackward>)
output :  tensor([[263150.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2064e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143721.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4482e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174340.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1796437.6250, grad_fn=<MseLossBackward>)
output :  tensor([[142643.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(6988753., grad_fn=<MseLossBackward>)
output :  tensor([[196739.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(14140068., grad_fn=<MseLossBackward>)
output :  tensor([[167802.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4828869., grad_fn=<MseLossBackward>)
output :  tensor([[240916.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9510863., grad_fn=<MseLossBackward>)
output :  tensor([[133544.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(913846.3750, grad_fn=<MseLossBackward>)
output :  tensor([[148970.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(143783.1562, grad_fn=<MseLossBackward>)
output :  tensor([[211327.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(13488863., grad_fn=<MseLossBackward>)
output :  tensor([[161279.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(13842237., grad_fn=<MseLossBackward>)
output :  tensor([[194187.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(26911292., grad_fn=<MseLossBackward>)
output :  tensor([[133903.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2981e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129502.]], grad_fn=<AddmmBackward>)
loss:  tensor(252004., grad_fn=<MseLossBackward>)
output :  tensor([[136230.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(14205479., grad_fn=<MseLossBackward>)
output :  tensor([[200400.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7748e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166787.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6819e+09, grad_fn=<MseLossBackward>)
output :  tensor([[76611.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7593e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96863.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5287e+08, grad_fn=<MseLossBackward>)
output :  tensor([[254717.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2029066.7500, grad_fn=<MseLossBackward>)
output :  tensor([[203710.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1875e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115108.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(11877.5938, grad_fn=<MseLossBackward>)
output :  tensor([[159728.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7124e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206068.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9410e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180109.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0803e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158269.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(10691265., grad_fn=<MseLossBackward>)
output :  tensor([[168860.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1298531.5000, grad_fn=<MseLossBackward>)
output :  tensor([[116042.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(1086431.6250, grad_fn=<MseLossBackward>)
output :  tensor([[163916.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(79499792., grad_fn=<MseLossBackward>)
output :  tensor([[192483.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0785e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219751.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(63173.6797, grad_fn=<MseLossBackward>)
output :  tensor([[246346.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4865e+11, grad_fn=<MseLossBackward>)
output :  tensor([[145446.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2414673.2500, grad_fn=<MseLossBackward>)
output :  tensor([[110432.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3811646., grad_fn=<MseLossBackward>)
output :  tensor([[169950.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4278e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152614.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4469260.5000, grad_fn=<MseLossBackward>)
output :  tensor([[232758.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(17990720., grad_fn=<MseLossBackward>)
output :  tensor([[115008.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(69.2276, grad_fn=<MseLossBackward>)
output :  tensor([[176484.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(41156836., grad_fn=<MseLossBackward>)
output :  tensor([[187802.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1216195.3750, grad_fn=<MseLossBackward>)
output :  tensor([[164908.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4053e+10, grad_fn=<MseLossBackward>)
output :  tensor([[95788.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1870e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239556.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(309900.9688, grad_fn=<MseLossBackward>)
output :  tensor([[179429.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(11763185., grad_fn=<MseLossBackward>)
output :  tensor([[139334.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(442391.2500, grad_fn=<MseLossBackward>)
output :  tensor([[234868.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(17242.9727, grad_fn=<MseLossBackward>)
output :  tensor([[161499.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2250375., grad_fn=<MseLossBackward>)
output :  tensor([[201963.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5138e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135278.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(77396.9766, grad_fn=<MseLossBackward>)
output :  tensor([[187922.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7195e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134280.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2955928., grad_fn=<MseLossBackward>)
output :  tensor([[223632.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5295e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224983.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2583e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91235.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(1526286.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160485.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1105093.7500, grad_fn=<MseLossBackward>)
output :  tensor([[242696.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6431e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149354.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(18957452., grad_fn=<MseLossBackward>)
output :  tensor([[109965.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8461e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164665.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(27431.6406, grad_fn=<MseLossBackward>)
output :  tensor([[141338.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7085162.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128831.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(398920.5312, grad_fn=<MseLossBackward>)
output :  tensor([[189554.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8227e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124439.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(3761872.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152734.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(539582.0625, grad_fn=<MseLossBackward>)
output :  tensor([[168154.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(12930092., grad_fn=<MseLossBackward>)
output :  tensor([[151454.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(206925.4844, grad_fn=<MseLossBackward>)
output :  tensor([[163846.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(895329.9375, grad_fn=<MseLossBackward>)
output :  tensor([[134938.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7282e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132628.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(394521.3750, grad_fn=<MseLossBackward>)
output :  tensor([[155909.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8594e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145646.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2234744.7500, grad_fn=<MseLossBackward>)
output :  tensor([[163799.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4199746., grad_fn=<MseLossBackward>)
output :  tensor([[140627.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4416e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151204.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5783799.5000, grad_fn=<MseLossBackward>)
output :  tensor([[184439.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(12675603., grad_fn=<MseLossBackward>)
output :  tensor([[170648.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2718273.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180168.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(28513.4883, grad_fn=<MseLossBackward>)
output :  tensor([[220858.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(737719.9375, grad_fn=<MseLossBackward>)
output :  tensor([[110316.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5840605., grad_fn=<MseLossBackward>)
output :  tensor([[140916.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5652e+08, grad_fn=<MseLossBackward>)
output :  tensor([[283508.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6208974., grad_fn=<MseLossBackward>)
output :  tensor([[116678.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(460500.0938, grad_fn=<MseLossBackward>)
output :  tensor([[174341.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0847e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179104.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(34758764., grad_fn=<MseLossBackward>)
output :  tensor([[175899.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(92177400., grad_fn=<MseLossBackward>)
output :  tensor([[250841.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8361e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219232.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7660613., grad_fn=<MseLossBackward>)
output :  tensor([[127240.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5540e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175884.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2372e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124893.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(797797.8750, grad_fn=<MseLossBackward>)
output :  tensor([[182400.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5730e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152069.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(866615.5625, grad_fn=<MseLossBackward>)
output :  tensor([[154263.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(60275088., grad_fn=<MseLossBackward>)
output :  tensor([[203652.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7010497.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145991.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8201e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173671.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5422785.5000, grad_fn=<MseLossBackward>)
output :  tensor([[249096.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2437e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148709.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(503345.9062, grad_fn=<MseLossBackward>)
output :  tensor([[198186.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(20059902., grad_fn=<MseLossBackward>)
output :  tensor([[162463.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6315640., grad_fn=<MseLossBackward>)
output :  tensor([[124988.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3682e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134623.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1269213.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182871.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1274394., grad_fn=<MseLossBackward>)
output :  tensor([[198342.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(69601480., grad_fn=<MseLossBackward>)
output :  tensor([[226452.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9122e+09, grad_fn=<MseLossBackward>)
output :  tensor([[247114.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(97732688., grad_fn=<MseLossBackward>)
output :  tensor([[184265.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8153e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143925.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7484e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145070.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(325933.9375, grad_fn=<MseLossBackward>)
output :  tensor([[72074.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0288e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143594.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(73870000., grad_fn=<MseLossBackward>)
output :  tensor([[127653.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1554892.1250, grad_fn=<MseLossBackward>)
output :  tensor([[154341.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(116398.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129923.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8545939., grad_fn=<MseLossBackward>)
output :  tensor([[77152.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(426174.3750, grad_fn=<MseLossBackward>)
output :  tensor([[81954.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(2039.7925, grad_fn=<MseLossBackward>)
output :  tensor([[235657.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(13374906., grad_fn=<MseLossBackward>)
output :  tensor([[139727.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4135e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131279.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(607133.1875, grad_fn=<MseLossBackward>)
output :  tensor([[167687.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(472849.6250, grad_fn=<MseLossBackward>)
output :  tensor([[232936.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4259580., grad_fn=<MseLossBackward>)
output :  tensor([[191467.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(451773.0312, grad_fn=<MseLossBackward>)
output :  tensor([[152473.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(12437194., grad_fn=<MseLossBackward>)
output :  tensor([[197129.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(593887., grad_fn=<MseLossBackward>)
output :  tensor([[201785.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2401e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138508.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2274394., grad_fn=<MseLossBackward>)
output :  tensor([[154804.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(38305.8281, grad_fn=<MseLossBackward>)
output :  tensor([[135681.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(101302.9531, grad_fn=<MseLossBackward>)
output :  tensor([[197613.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0489e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153625.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(140355.5938, grad_fn=<MseLossBackward>)
output :  tensor([[138715.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0445e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146722.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3321221.5000, grad_fn=<MseLossBackward>)
output :  tensor([[208269.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(13915931., grad_fn=<MseLossBackward>)
output :  tensor([[102453.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1833e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166745.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(569859.8750, grad_fn=<MseLossBackward>)
output :  tensor([[126426.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2476935., grad_fn=<MseLossBackward>)
output :  tensor([[146007.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(984932.1875, grad_fn=<MseLossBackward>)
output :  tensor([[104824.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8013e+09, grad_fn=<MseLossBackward>)
output :  tensor([[140799.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(10887422., grad_fn=<MseLossBackward>)
output :  tensor([[239936.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(15492342., grad_fn=<MseLossBackward>)
output :  tensor([[144421.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(335023.9062, grad_fn=<MseLossBackward>)
output :  tensor([[139426.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3711643., grad_fn=<MseLossBackward>)
output :  tensor([[164665.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3444e+09, grad_fn=<MseLossBackward>)
output :  tensor([[267732.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0543e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178060.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(9366278., grad_fn=<MseLossBackward>)
output :  tensor([[103544.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(590892.5000, grad_fn=<MseLossBackward>)
output :  tensor([[199825.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0333e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159803.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(645260.7500, grad_fn=<MseLossBackward>)
output :  tensor([[162502.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6192e+10, grad_fn=<MseLossBackward>)
output :  tensor([[98655.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(126108.2188, grad_fn=<MseLossBackward>)
output :  tensor([[123855.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(65188.4609, grad_fn=<MseLossBackward>)
output :  tensor([[154199.]], grad_fn=<AddmmBackward>)
loss:  tensor(3243601., grad_fn=<MseLossBackward>)
output :  tensor([[140955.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(913308.7500, grad_fn=<MseLossBackward>)
output :  tensor([[201655.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2740369.7500, grad_fn=<MseLossBackward>)
output :  tensor([[140654.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1809655.5000, grad_fn=<MseLossBackward>)
output :  tensor([[260806.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2170005.2500, grad_fn=<MseLossBackward>)
output :  tensor([[127283.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1754e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166401.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(813096.6875, grad_fn=<MseLossBackward>)
output :  tensor([[190541.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4166382.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124053.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9750e+08, grad_fn=<MseLossBackward>)
output :  tensor([[252549.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6501942., grad_fn=<MseLossBackward>)
output :  tensor([[156867.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0795e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243584.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3118645.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147198.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(10228403., grad_fn=<MseLossBackward>)
output :  tensor([[211861.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3465589.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176861.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(19903448., grad_fn=<MseLossBackward>)
output :  tensor([[154457.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(209149.0156, grad_fn=<MseLossBackward>)
output :  tensor([[117838.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(26044.4121, grad_fn=<MseLossBackward>)
output :  tensor([[239118.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3013e+09, grad_fn=<MseLossBackward>)
output :  tensor([[240088.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7918.2188, grad_fn=<MseLossBackward>)
output :  tensor([[151759.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2489443., grad_fn=<MseLossBackward>)
output :  tensor([[256059.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1344440.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123046.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(72974304., grad_fn=<MseLossBackward>)
output :  tensor([[177956.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3827770., grad_fn=<MseLossBackward>)
output :  tensor([[161104.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1219989.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132362.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1856363.6250, grad_fn=<MseLossBackward>)
output :  tensor([[195542.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3617e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163673.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(106755.3516, grad_fn=<MseLossBackward>)
output :  tensor([[165773.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7689789., grad_fn=<MseLossBackward>)
output :  tensor([[155416.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6672050.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144587.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(28222822., grad_fn=<MseLossBackward>)
output :  tensor([[174672.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2474e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159459.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(292072.6875, grad_fn=<MseLossBackward>)
output :  tensor([[370815.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7304e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122277.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(22299276., grad_fn=<MseLossBackward>)
output :  tensor([[131199.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0885e+09, grad_fn=<MseLossBackward>)
output :  tensor([[279676.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2362273., grad_fn=<MseLossBackward>)
output :  tensor([[162549.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(302276.5938, grad_fn=<MseLossBackward>)
output :  tensor([[131570.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2256e+08, grad_fn=<MseLossBackward>)
output :  tensor([[229318.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7190610., grad_fn=<MseLossBackward>)
output :  tensor([[182854.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(5545215.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154404.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5781770.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142868.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4543225.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155019.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2832e+08, grad_fn=<MseLossBackward>)
output :  tensor([[102302.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(5301830., grad_fn=<MseLossBackward>)
output :  tensor([[79979.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9919e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161961.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(9234286., grad_fn=<MseLossBackward>)
output :  tensor([[186653.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7095e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158595.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(354620.2500, grad_fn=<MseLossBackward>)
output :  tensor([[160696.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(10217113., grad_fn=<MseLossBackward>)
output :  tensor([[136342.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1225552.7500, grad_fn=<MseLossBackward>)
output :  tensor([[208517.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(6590853., grad_fn=<MseLossBackward>)
output :  tensor([[137646.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(125227.5156, grad_fn=<MseLossBackward>)
output :  tensor([[181515.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6508e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143678.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5387621.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110933.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8029e+08, grad_fn=<MseLossBackward>)
output :  tensor([[89539.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(19896408., grad_fn=<MseLossBackward>)
output :  tensor([[175258.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(66862.6484, grad_fn=<MseLossBackward>)
output :  tensor([[254715.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(32317804., grad_fn=<MseLossBackward>)
output :  tensor([[141256.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(59360.7539, grad_fn=<MseLossBackward>)
output :  tensor([[159258.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(405490.3750, grad_fn=<MseLossBackward>)
output :  tensor([[132799.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(89644.1016, grad_fn=<MseLossBackward>)
output :  tensor([[142956.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(42813916., grad_fn=<MseLossBackward>)
output :  tensor([[169008.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1229257.2500, grad_fn=<MseLossBackward>)
output :  tensor([[127773.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(598616.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171954.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2656e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156905.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8989.4102, grad_fn=<MseLossBackward>)
output :  tensor([[114685.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3293601., grad_fn=<MseLossBackward>)
output :  tensor([[159474.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4061e+09, grad_fn=<MseLossBackward>)
output :  tensor([[52952.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(907955.8750, grad_fn=<MseLossBackward>)
output :  tensor([[231660.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5350e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200205.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(631553.0625, grad_fn=<MseLossBackward>)
output :  tensor([[182109.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8356435.5000, grad_fn=<MseLossBackward>)
output :  tensor([[106020.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(410.3790, grad_fn=<MseLossBackward>)
output :  tensor([[87378.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(142943.0625, grad_fn=<MseLossBackward>)
output :  tensor([[141319.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1740296.8750, grad_fn=<MseLossBackward>)
output :  tensor([[217138.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9077e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200752.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(45531708., grad_fn=<MseLossBackward>)
output :  tensor([[162443.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6534733.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172600.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5377e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191312.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1721426., grad_fn=<MseLossBackward>)
output :  tensor([[89722.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7410900.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139091.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(825315.5000, grad_fn=<MseLossBackward>)
output :  tensor([[108874.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2643113.7500, grad_fn=<MseLossBackward>)
output :  tensor([[148625.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6040e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172297.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7055e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192845.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4773e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178369.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2657002., grad_fn=<MseLossBackward>)
output :  tensor([[97060.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(314493.1250, grad_fn=<MseLossBackward>)
output :  tensor([[118067.]], grad_fn=<AddmmBackward>)
loss:  tensor(321489., grad_fn=<MseLossBackward>)
output :  tensor([[160414.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5626e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196782.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(10354217., grad_fn=<MseLossBackward>)
output :  tensor([[144648.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(419985., grad_fn=<MseLossBackward>)
train_loss: [2.6317338e+09]
epoch_result tensor([0.])
output :  tensor([[157656.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(711202.3125, grad_fn=<MseLossBackward>)
output :  tensor([[123364.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(1861497.8750, grad_fn=<MseLossBackward>)
output :  tensor([[195525.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1753927.7500, grad_fn=<MseLossBackward>)
output :  tensor([[175371.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2652724.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153200.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1500e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131480.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(12112901., grad_fn=<MseLossBackward>)
output :  tensor([[140593.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(164899.4375, grad_fn=<MseLossBackward>)
output :  tensor([[119196.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(38676.7539, grad_fn=<MseLossBackward>)
output :  tensor([[68835.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0681e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165829.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(29022.3164, grad_fn=<MseLossBackward>)
output :  tensor([[143954.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(15638935., grad_fn=<MseLossBackward>)
output :  tensor([[224261.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(545151.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168784.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(46514.3594, grad_fn=<MseLossBackward>)
output :  tensor([[249927.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(51955.5039, grad_fn=<MseLossBackward>)
output :  tensor([[57704.0586]], grad_fn=<AddmmBackward>)
loss:  tensor(7311933., grad_fn=<MseLossBackward>)
output :  tensor([[162968.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4110e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169693.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(28159606., grad_fn=<MseLossBackward>)
output :  tensor([[167675.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2489e+08, grad_fn=<MseLossBackward>)
output :  tensor([[273231.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3126487., grad_fn=<MseLossBackward>)
output :  tensor([[195246.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3073995.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138336.]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5166e+10, grad_fn=<MseLossBackward>)
output :  tensor([[197102.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(10393471., grad_fn=<MseLossBackward>)
output :  tensor([[176840.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3097e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151720.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(518985.1562, grad_fn=<MseLossBackward>)
output :  tensor([[168399.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2562300.5000, grad_fn=<MseLossBackward>)
output :  tensor([[85212.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(35021.6133, grad_fn=<MseLossBackward>)
output :  tensor([[169248.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1639e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184789.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(44441.9102, grad_fn=<MseLossBackward>)
output :  tensor([[204553.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5955e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111362.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1855469.6250, grad_fn=<MseLossBackward>)
output :  tensor([[172099.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1209140.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135916.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(340344.6250, grad_fn=<MseLossBackward>)
output :  tensor([[130955.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3823735.7500, grad_fn=<MseLossBackward>)
output :  tensor([[121162.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(2764763.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146352.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6154e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168243.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1537e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151817.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4482284.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178040.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3840558.7500, grad_fn=<MseLossBackward>)
output :  tensor([[140361.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(407422.9062, grad_fn=<MseLossBackward>)
output :  tensor([[107553.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0813e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134285.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5149e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146510.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3249e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138905.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4175e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223754.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1551776.2500, grad_fn=<MseLossBackward>)
output :  tensor([[131586.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(440875.2500, grad_fn=<MseLossBackward>)
output :  tensor([[147367.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2664291., grad_fn=<MseLossBackward>)
output :  tensor([[109634.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(5593336., grad_fn=<MseLossBackward>)
output :  tensor([[160245.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(60185.8906, grad_fn=<MseLossBackward>)
output :  tensor([[147991.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2098e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191952.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2222.2385, grad_fn=<MseLossBackward>)
output :  tensor([[136165.]], grad_fn=<AddmmBackward>)
loss:  tensor(2941225., grad_fn=<MseLossBackward>)
output :  tensor([[110310.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(96211.4375, grad_fn=<MseLossBackward>)
output :  tensor([[232431.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2458722., grad_fn=<MseLossBackward>)
output :  tensor([[164568.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3933e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158351.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(420248.3125, grad_fn=<MseLossBackward>)
output :  tensor([[203199.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8663e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243734.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2158e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147002.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(12270900., grad_fn=<MseLossBackward>)
output :  tensor([[132009.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3963521., grad_fn=<MseLossBackward>)
output :  tensor([[152783.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4913565., grad_fn=<MseLossBackward>)
output :  tensor([[133733.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(13937739., grad_fn=<MseLossBackward>)
output :  tensor([[182709.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9739e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182810.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1662367., grad_fn=<MseLossBackward>)
output :  tensor([[162370.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(757443.8750, grad_fn=<MseLossBackward>)
output :  tensor([[144303.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1700171.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144935.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5930290.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146748.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3056050.2500, grad_fn=<MseLossBackward>)
output :  tensor([[173563.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3722e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194242.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1791e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139942.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(11849946., grad_fn=<MseLossBackward>)
output :  tensor([[176616.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(22243456., grad_fn=<MseLossBackward>)
output :  tensor([[181668.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(447163.8750, grad_fn=<MseLossBackward>)
output :  tensor([[115562.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(315966.9375, grad_fn=<MseLossBackward>)
output :  tensor([[217228.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(14225273., grad_fn=<MseLossBackward>)
output :  tensor([[183673.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(30042.6387, grad_fn=<MseLossBackward>)
output :  tensor([[125525.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(670.7291, grad_fn=<MseLossBackward>)
output :  tensor([[195857.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(413027.1250, grad_fn=<MseLossBackward>)
output :  tensor([[176938.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4153826.2500, grad_fn=<MseLossBackward>)
output :  tensor([[206292.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2385e+10, grad_fn=<MseLossBackward>)
output :  tensor([[210796.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(41437.6914, grad_fn=<MseLossBackward>)
output :  tensor([[170032.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5235e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194882.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(146186.7500, grad_fn=<MseLossBackward>)
output :  tensor([[112702.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(88417.9531, grad_fn=<MseLossBackward>)
output :  tensor([[114479.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3918605.7500, grad_fn=<MseLossBackward>)
output :  tensor([[113866.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(3482160., grad_fn=<MseLossBackward>)
output :  tensor([[148432.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2666025.7500, grad_fn=<MseLossBackward>)
output :  tensor([[162001.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2631e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180067.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4547.8164, grad_fn=<MseLossBackward>)
output :  tensor([[127931.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(186225.9688, grad_fn=<MseLossBackward>)
output :  tensor([[144037.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(927098.1875, grad_fn=<MseLossBackward>)
output :  tensor([[183553.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3672e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119652.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(7574450., grad_fn=<MseLossBackward>)
output :  tensor([[190917.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(36993196., grad_fn=<MseLossBackward>)
output :  tensor([[146106.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1224999.3750, grad_fn=<MseLossBackward>)
output :  tensor([[210328.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6615023.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126046.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2130.3994, grad_fn=<MseLossBackward>)
output :  tensor([[243810.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(20411054., grad_fn=<MseLossBackward>)
output :  tensor([[237860.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2221e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151829.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1735e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85860.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1802e+08, grad_fn=<MseLossBackward>)
output :  tensor([[191744.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9149e+09, grad_fn=<MseLossBackward>)
output :  tensor([[82760.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3100790.7500, grad_fn=<MseLossBackward>)
output :  tensor([[141326.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3336444.7500, grad_fn=<MseLossBackward>)
output :  tensor([[77342.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(3394720., grad_fn=<MseLossBackward>)
output :  tensor([[144098.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1312635.6250, grad_fn=<MseLossBackward>)
output :  tensor([[177034.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1069285.2500, grad_fn=<MseLossBackward>)
output :  tensor([[152368.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1281247.1250, grad_fn=<MseLossBackward>)
output :  tensor([[107348.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2649.0322, grad_fn=<MseLossBackward>)
output :  tensor([[204301.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2421e+10, grad_fn=<MseLossBackward>)
output :  tensor([[127539.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(921750., grad_fn=<MseLossBackward>)
output :  tensor([[271049.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(80106976., grad_fn=<MseLossBackward>)
output :  tensor([[304259.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(32947958., grad_fn=<MseLossBackward>)
output :  tensor([[108843.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1805622.1250, grad_fn=<MseLossBackward>)
output :  tensor([[170999.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2252016., grad_fn=<MseLossBackward>)
output :  tensor([[133477.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4910e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131459.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(56861968., grad_fn=<MseLossBackward>)
output :  tensor([[129520.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(532158.8750, grad_fn=<MseLossBackward>)
output :  tensor([[127544.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(6474202., grad_fn=<MseLossBackward>)
output :  tensor([[135636.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8312e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227371.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8271e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188863.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3145e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144885.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(970933.1250, grad_fn=<MseLossBackward>)
output :  tensor([[135273.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(60425360., grad_fn=<MseLossBackward>)
output :  tensor([[112779.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2338127.7500, grad_fn=<MseLossBackward>)
output :  tensor([[255530.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9101e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137118.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4486917., grad_fn=<MseLossBackward>)
output :  tensor([[203288.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(83268.3125, grad_fn=<MseLossBackward>)
output :  tensor([[102564.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(5456859.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141406.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2121665.2500, grad_fn=<MseLossBackward>)
output :  tensor([[206705.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1664e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183736.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(14716215., grad_fn=<MseLossBackward>)
output :  tensor([[184755.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(60002.0352, grad_fn=<MseLossBackward>)
output :  tensor([[162938.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1334e+10, grad_fn=<MseLossBackward>)
output :  tensor([[296294.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4981e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196442.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2124124., grad_fn=<MseLossBackward>)
output :  tensor([[258791.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0756e+10, grad_fn=<MseLossBackward>)
output :  tensor([[219424.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1692e+09, grad_fn=<MseLossBackward>)
output :  tensor([[279584.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3999e+09, grad_fn=<MseLossBackward>)
output :  tensor([[225480.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2192296.7500, grad_fn=<MseLossBackward>)
output :  tensor([[222479.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8737e+10, grad_fn=<MseLossBackward>)
output :  tensor([[197313.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(98037.4844, grad_fn=<MseLossBackward>)
output :  tensor([[159854.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5197e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134781.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5205028.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134212.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1656771.2500, grad_fn=<MseLossBackward>)
output :  tensor([[90477.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(272989.9375, grad_fn=<MseLossBackward>)
output :  tensor([[112916.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(24174968., grad_fn=<MseLossBackward>)
output :  tensor([[272463.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1850e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236463.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2140826.2500, grad_fn=<MseLossBackward>)
output :  tensor([[147219.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4924238.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140346.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8100872., grad_fn=<MseLossBackward>)
output :  tensor([[172551.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1396976.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144621.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(394599.9062, grad_fn=<MseLossBackward>)
output :  tensor([[164641.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9152e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164471.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(279477.4375, grad_fn=<MseLossBackward>)
output :  tensor([[136615.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(148068.6406, grad_fn=<MseLossBackward>)
output :  tensor([[191699.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7886e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111900.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(9954.7393, grad_fn=<MseLossBackward>)
output :  tensor([[167616.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(19211922., grad_fn=<MseLossBackward>)
output :  tensor([[119691.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(95268.6797, grad_fn=<MseLossBackward>)
output :  tensor([[85037.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(3850762.2500, grad_fn=<MseLossBackward>)
output :  tensor([[179747.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(63850.9727, grad_fn=<MseLossBackward>)
output :  tensor([[110582.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(466243.5938, grad_fn=<MseLossBackward>)
output :  tensor([[244256.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(27634406., grad_fn=<MseLossBackward>)
output :  tensor([[248574.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(12777832., grad_fn=<MseLossBackward>)
output :  tensor([[127420.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4325360., grad_fn=<MseLossBackward>)
output :  tensor([[111831.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8249820., grad_fn=<MseLossBackward>)
output :  tensor([[287706.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2334e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170073.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2035793.8750, grad_fn=<MseLossBackward>)
output :  tensor([[123498.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2253282.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145334.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4719e+08, grad_fn=<MseLossBackward>)
output :  tensor([[200573.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8028e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141416.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(173706.6094, grad_fn=<MseLossBackward>)
output :  tensor([[158069.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4867e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150524.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(11396216., grad_fn=<MseLossBackward>)
output :  tensor([[130004.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(254488.7188, grad_fn=<MseLossBackward>)
output :  tensor([[245383.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7720e+10, grad_fn=<MseLossBackward>)
output :  tensor([[399687.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5348090., grad_fn=<MseLossBackward>)
output :  tensor([[105454.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(12572786., grad_fn=<MseLossBackward>)
output :  tensor([[112236.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(39236424., grad_fn=<MseLossBackward>)
output :  tensor([[156363.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9835182., grad_fn=<MseLossBackward>)
output :  tensor([[133750.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1003e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161840.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6191e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174188.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1201e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103827.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(51681.6289, grad_fn=<MseLossBackward>)
output :  tensor([[138534.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6077997., grad_fn=<MseLossBackward>)
output :  tensor([[363903.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(11494007., grad_fn=<MseLossBackward>)
output :  tensor([[202667.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6351e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176759.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1585159.7500, grad_fn=<MseLossBackward>)
output :  tensor([[200384.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6326718.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139767.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(589800., grad_fn=<MseLossBackward>)
output :  tensor([[192540.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3838477., grad_fn=<MseLossBackward>)
output :  tensor([[137534.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0210e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183311.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5343465.5000, grad_fn=<MseLossBackward>)
output :  tensor([[242754.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(569199.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174408.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(167268.2188, grad_fn=<MseLossBackward>)
output :  tensor([[108955.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(912786.1875, grad_fn=<MseLossBackward>)
output :  tensor([[265376.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(664530.6875, grad_fn=<MseLossBackward>)
output :  tensor([[251743.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3041209., grad_fn=<MseLossBackward>)
output :  tensor([[128743.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(32987612., grad_fn=<MseLossBackward>)
output :  tensor([[214042.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7158e+09, grad_fn=<MseLossBackward>)
output :  tensor([[303948.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5590e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209447.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5991633., grad_fn=<MseLossBackward>)
output :  tensor([[212391.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6284e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160558.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7069034.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170402.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(170182.0312, grad_fn=<MseLossBackward>)
output :  tensor([[162635.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(32524922., grad_fn=<MseLossBackward>)
output :  tensor([[166649.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(11228468., grad_fn=<MseLossBackward>)
output :  tensor([[234849.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0990e+09, grad_fn=<MseLossBackward>)
output :  tensor([[218493.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2018e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161619.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1373e+08, grad_fn=<MseLossBackward>)
output :  tensor([[120690.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5334295.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178300.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1691950.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180233.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3627e+09, grad_fn=<MseLossBackward>)
output :  tensor([[206266.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5476e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135260.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(686515.8125, grad_fn=<MseLossBackward>)
output :  tensor([[149796.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9506e+08, grad_fn=<MseLossBackward>)
output :  tensor([[270766.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(38861196., grad_fn=<MseLossBackward>)
output :  tensor([[86572.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(2473174., grad_fn=<MseLossBackward>)
output :  tensor([[240215.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(13807146., grad_fn=<MseLossBackward>)
output :  tensor([[258534.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0523e+11, grad_fn=<MseLossBackward>)
output :  tensor([[170671.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(451185.0938, grad_fn=<MseLossBackward>)
output :  tensor([[192443.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8110e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154389.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(372653.0312, grad_fn=<MseLossBackward>)
output :  tensor([[205349.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1796e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127534.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(2148995.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147409.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5803431.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171468.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3916e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184918.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(867372.0625, grad_fn=<MseLossBackward>)
output :  tensor([[129955.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(15648514., grad_fn=<MseLossBackward>)
output :  tensor([[139345.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8094736.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170154.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(8094914., grad_fn=<MseLossBackward>)
output :  tensor([[198191.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6841e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238852.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(17202922., grad_fn=<MseLossBackward>)
output :  tensor([[152717.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(5212017.5000, grad_fn=<MseLossBackward>)
output :  tensor([[197744.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3044152.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163761.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9053e+08, grad_fn=<MseLossBackward>)
output :  tensor([[170628.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(78699080., grad_fn=<MseLossBackward>)
output :  tensor([[182717.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(7936369.5000, grad_fn=<MseLossBackward>)
output :  tensor([[99884.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8321422., grad_fn=<MseLossBackward>)
output :  tensor([[172933.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1463e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134996.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(11.6025, grad_fn=<MseLossBackward>)
output :  tensor([[120804.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(33688320., grad_fn=<MseLossBackward>)
output :  tensor([[174286.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(81992.7422, grad_fn=<MseLossBackward>)
output :  tensor([[84611.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(151308.8438, grad_fn=<MseLossBackward>)
output :  tensor([[280782.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(84964032., grad_fn=<MseLossBackward>)
output :  tensor([[170022.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(25222210., grad_fn=<MseLossBackward>)
output :  tensor([[189934.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0516e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243931.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3272e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149580.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2014980.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123879.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(14428.1387, grad_fn=<MseLossBackward>)
output :  tensor([[118340.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2433112.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144293.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5813e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175744.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3042789.7500, grad_fn=<MseLossBackward>)
output :  tensor([[110348.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7554e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209131.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1852e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243113.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2603180.5000, grad_fn=<MseLossBackward>)
output :  tensor([[249013.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1368e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221766.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9698e+08, grad_fn=<MseLossBackward>)
output :  tensor([[193720.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4830e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189064.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2447758., grad_fn=<MseLossBackward>)
output :  tensor([[205424.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8157e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187760.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1975e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174042.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(22069002., grad_fn=<MseLossBackward>)
output :  tensor([[154361.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5578453.5000, grad_fn=<MseLossBackward>)
output :  tensor([[336491.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(258604.0312, grad_fn=<MseLossBackward>)
output :  tensor([[211149.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(723536.3125, grad_fn=<MseLossBackward>)
output :  tensor([[159668.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(109871.5312, grad_fn=<MseLossBackward>)
output :  tensor([[186959.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9747e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105806.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(650782.5625, grad_fn=<MseLossBackward>)
output :  tensor([[273068.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9486e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171161.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(7500837., grad_fn=<MseLossBackward>)
output :  tensor([[206030.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(55791796., grad_fn=<MseLossBackward>)
output :  tensor([[205158.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5096e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177845.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1834035.3750, grad_fn=<MseLossBackward>)
output :  tensor([[198557.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(10516441., grad_fn=<MseLossBackward>)
output :  tensor([[156080.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1167075.1250, grad_fn=<MseLossBackward>)
output :  tensor([[148773.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3789e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118800.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(90093.7734, grad_fn=<MseLossBackward>)
output :  tensor([[140237.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(56554.7852, grad_fn=<MseLossBackward>)
output :  tensor([[148488.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(261536.3594, grad_fn=<MseLossBackward>)
output :  tensor([[200210.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6330e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159755.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(65184.4727, grad_fn=<MseLossBackward>)
output :  tensor([[103535.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(16285702., grad_fn=<MseLossBackward>)
output :  tensor([[223635.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6781e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186065.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2295e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174369.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4473820., grad_fn=<MseLossBackward>)
output :  tensor([[80244.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(3082521., grad_fn=<MseLossBackward>)
output :  tensor([[128329.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(29208.9453, grad_fn=<MseLossBackward>)
output :  tensor([[217436.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(11808244., grad_fn=<MseLossBackward>)
output :  tensor([[142492.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2272367.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128483.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2300009.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144127.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2331967.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179714.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7821e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144970.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(941597.3125, grad_fn=<MseLossBackward>)
output :  tensor([[159149.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(722978.1875, grad_fn=<MseLossBackward>)
output :  tensor([[213721.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1634322.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138990.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1554e+09, grad_fn=<MseLossBackward>)
output :  tensor([[258167.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(10035234., grad_fn=<MseLossBackward>)
output :  tensor([[155329.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(17392680., grad_fn=<MseLossBackward>)
output :  tensor([[128146.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(124951.2031, grad_fn=<MseLossBackward>)
output :  tensor([[95278.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(77362.2109, grad_fn=<MseLossBackward>)
output :  tensor([[155027.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9741e+09, grad_fn=<MseLossBackward>)
output :  tensor([[177459.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5954134., grad_fn=<MseLossBackward>)
output :  tensor([[118982.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(2301312.7500, grad_fn=<MseLossBackward>)
output :  tensor([[188126.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6665e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145433.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3472e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148514.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1919090.7500, grad_fn=<MseLossBackward>)
output :  tensor([[187789.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1593.7561, grad_fn=<MseLossBackward>)
output :  tensor([[252674.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6323e+09, grad_fn=<MseLossBackward>)
output :  tensor([[91423.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(5824.7900, grad_fn=<MseLossBackward>)
output :  tensor([[239095.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(818346.3750, grad_fn=<MseLossBackward>)
output :  tensor([[128966.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(217775.3438, grad_fn=<MseLossBackward>)
output :  tensor([[165295.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0121e+10, grad_fn=<MseLossBackward>)
output :  tensor([[113008.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6922e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177949.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3799210., grad_fn=<MseLossBackward>)
output :  tensor([[163869.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9874e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154020.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5323e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236829.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4711748.5000, grad_fn=<MseLossBackward>)
output :  tensor([[226107.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0172e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128772.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(3143002.7500, grad_fn=<MseLossBackward>)
output :  tensor([[127102.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1214472.8750, grad_fn=<MseLossBackward>)
output :  tensor([[222878.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(16984960., grad_fn=<MseLossBackward>)
output :  tensor([[229071.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(24291498., grad_fn=<MseLossBackward>)
output :  tensor([[227931.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1516669.2500, grad_fn=<MseLossBackward>)
output :  tensor([[152390.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(19273060., grad_fn=<MseLossBackward>)
output :  tensor([[210221.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(49096.8672, grad_fn=<MseLossBackward>)
output :  tensor([[130515.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1058e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136451.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(15614723., grad_fn=<MseLossBackward>)
output :  tensor([[311382.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(13085854., grad_fn=<MseLossBackward>)
output :  tensor([[142093.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1194922.2500, grad_fn=<MseLossBackward>)
output :  tensor([[122688.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1012e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108774.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(526486.3125, grad_fn=<MseLossBackward>)
output :  tensor([[153497.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6108e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179931.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9859e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173875.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(766336.1250, grad_fn=<MseLossBackward>)
output :  tensor([[192361.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(74622600., grad_fn=<MseLossBackward>)
output :  tensor([[96815.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(10142334., grad_fn=<MseLossBackward>)
output :  tensor([[178144.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(731345.6875, grad_fn=<MseLossBackward>)
output :  tensor([[172319.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(19536262., grad_fn=<MseLossBackward>)
output :  tensor([[141542.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6466690., grad_fn=<MseLossBackward>)
output :  tensor([[258459.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0129e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141093.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1465e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175000.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4002062.7500, grad_fn=<MseLossBackward>)
output :  tensor([[139783.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(46899.3164, grad_fn=<MseLossBackward>)
output :  tensor([[195262.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(27435008., grad_fn=<MseLossBackward>)
output :  tensor([[168393.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2579738., grad_fn=<MseLossBackward>)
output :  tensor([[243577.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(178810.0469, grad_fn=<MseLossBackward>)
output :  tensor([[134048.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(203457.3750, grad_fn=<MseLossBackward>)
output :  tensor([[150048.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(488469.9375, grad_fn=<MseLossBackward>)
output :  tensor([[215689.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(475949.0625, grad_fn=<MseLossBackward>)
output :  tensor([[168225.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(10405362., grad_fn=<MseLossBackward>)
output :  tensor([[193533.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(20556448., grad_fn=<MseLossBackward>)
output :  tensor([[134160.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1702e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127775.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1499859.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140154.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(23894.3965, grad_fn=<MseLossBackward>)
output :  tensor([[199843.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8521e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164994.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4994e+09, grad_fn=<MseLossBackward>)
output :  tensor([[77579.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0903e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94693.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0391e+08, grad_fn=<MseLossBackward>)
output :  tensor([[245894.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(54735720., grad_fn=<MseLossBackward>)
output :  tensor([[201766.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9396e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110850.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(17221008., grad_fn=<MseLossBackward>)
output :  tensor([[159793.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6763e+08, grad_fn=<MseLossBackward>)
output :  tensor([[205068.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2296e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177862.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4894e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155619.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(383818.9688, grad_fn=<MseLossBackward>)
output :  tensor([[172516.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6334895.5000, grad_fn=<MseLossBackward>)
output :  tensor([[115265.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(70361.7109, grad_fn=<MseLossBackward>)
output :  tensor([[163858.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(78479112., grad_fn=<MseLossBackward>)
output :  tensor([[191415.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3976e+08, grad_fn=<MseLossBackward>)
output :  tensor([[218591.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(825996.9375, grad_fn=<MseLossBackward>)
output :  tensor([[246775.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4823e+11, grad_fn=<MseLossBackward>)
output :  tensor([[148909.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3644639., grad_fn=<MseLossBackward>)
output :  tensor([[109475.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(990709.1875, grad_fn=<MseLossBackward>)
output :  tensor([[167422.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0961e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148326.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4724713.5000, grad_fn=<MseLossBackward>)
output :  tensor([[235402.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2551008., grad_fn=<MseLossBackward>)
output :  tensor([[115768.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(590400.1250, grad_fn=<MseLossBackward>)
output :  tensor([[182945.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2034.8557, grad_fn=<MseLossBackward>)
output :  tensor([[184824.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3516211., grad_fn=<MseLossBackward>)
output :  tensor([[163275.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4563e+10, grad_fn=<MseLossBackward>)
output :  tensor([[95422.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0801e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239076.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5854.6406, grad_fn=<MseLossBackward>)
output :  tensor([[175113.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(786491.8125, grad_fn=<MseLossBackward>)
output :  tensor([[140584.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(341713.3125, grad_fn=<MseLossBackward>)
output :  tensor([[234788.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(44725.6406, grad_fn=<MseLossBackward>)
output :  tensor([[166372.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(11375021., grad_fn=<MseLossBackward>)
output :  tensor([[201220.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5321e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135108.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(11860.5713, grad_fn=<MseLossBackward>)
output :  tensor([[185352.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4532e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135418.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(338287.6250, grad_fn=<MseLossBackward>)
output :  tensor([[227823.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(66853876., grad_fn=<MseLossBackward>)
output :  tensor([[222798.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3993e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91768.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(3125851.7500, grad_fn=<MseLossBackward>)
output :  tensor([[158558.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(766035.1875, grad_fn=<MseLossBackward>)
output :  tensor([[245620.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5690e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146589.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2527702.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109461.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8029e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165255.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(570331.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147078.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(9475334., grad_fn=<MseLossBackward>)
output :  tensor([[128597.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(158180.2031, grad_fn=<MseLossBackward>)
output :  tensor([[189625.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8128e+09, grad_fn=<MseLossBackward>)
output :  tensor([[122102.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(157801.3594, grad_fn=<MseLossBackward>)
output :  tensor([[149999.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4000937.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169397.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(5532712.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151827.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(684032.3750, grad_fn=<MseLossBackward>)
output :  tensor([[158543.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(18976642., grad_fn=<MseLossBackward>)
output :  tensor([[135045.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7837e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134115.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4474084.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153571.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1233e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144049.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(10541.5137, grad_fn=<MseLossBackward>)
output :  tensor([[165292.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(12547535., grad_fn=<MseLossBackward>)
output :  tensor([[139957.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0345e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150492.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2864503.2500, grad_fn=<MseLossBackward>)
output :  tensor([[183961.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(16307211., grad_fn=<MseLossBackward>)
output :  tensor([[169608.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(370766.8125, grad_fn=<MseLossBackward>)
output :  tensor([[180423.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(179431.6719, grad_fn=<MseLossBackward>)
output :  tensor([[219911.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7766.0156, grad_fn=<MseLossBackward>)
output :  tensor([[115050.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(51136576., grad_fn=<MseLossBackward>)
output :  tensor([[138877.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9538e+08, grad_fn=<MseLossBackward>)
output :  tensor([[287051.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1104995.1250, grad_fn=<MseLossBackward>)
output :  tensor([[118216.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(4912907., grad_fn=<MseLossBackward>)
output :  tensor([[176127.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9248e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185771.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(594609.6875, grad_fn=<MseLossBackward>)
output :  tensor([[176609.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(79035992., grad_fn=<MseLossBackward>)
output :  tensor([[250453.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0254e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221249.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(563813.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132871.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2745e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176652.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5945e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123444.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(308745.1875, grad_fn=<MseLossBackward>)
output :  tensor([[182799.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5526e+10, grad_fn=<MseLossBackward>)
output :  tensor([[156918.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(15351581., grad_fn=<MseLossBackward>)
output :  tensor([[155436.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(79862432., grad_fn=<MseLossBackward>)
output :  tensor([[207416.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1246502.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145658.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7316e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175560.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(193462.5312, grad_fn=<MseLossBackward>)
output :  tensor([[248307.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7295e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147198.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(642953.3750, grad_fn=<MseLossBackward>)
output :  tensor([[200785.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3532696.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157280.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7125813., grad_fn=<MseLossBackward>)
output :  tensor([[125626.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4157e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138691.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8653525., grad_fn=<MseLossBackward>)
output :  tensor([[185649.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2719510.2500, grad_fn=<MseLossBackward>)
output :  tensor([[194264.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(18187826., grad_fn=<MseLossBackward>)
output :  tensor([[219537.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8251e+09, grad_fn=<MseLossBackward>)
output :  tensor([[252896.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(16837174., grad_fn=<MseLossBackward>)
output :  tensor([[181776.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8830e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142479.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5989e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142903.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2550359., grad_fn=<MseLossBackward>)
output :  tensor([[73699.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1357e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133574.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2031738.3750, grad_fn=<MseLossBackward>)
output :  tensor([[132263.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(11313448., grad_fn=<MseLossBackward>)
output :  tensor([[154395.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(156271.9688, grad_fn=<MseLossBackward>)
output :  tensor([[127325.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(105818.0547, grad_fn=<MseLossBackward>)
output :  tensor([[75646.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(728142.2500, grad_fn=<MseLossBackward>)
output :  tensor([[85013.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(9082359., grad_fn=<MseLossBackward>)
output :  tensor([[224674.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(53664552., grad_fn=<MseLossBackward>)
output :  tensor([[140455.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8153e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129329.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1369009.7500, grad_fn=<MseLossBackward>)
output :  tensor([[168908.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3640821.7500, grad_fn=<MseLossBackward>)
output :  tensor([[236409.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1985633.2500, grad_fn=<MseLossBackward>)
output :  tensor([[189471.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7123311., grad_fn=<MseLossBackward>)
output :  tensor([[155029.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(942476.9375, grad_fn=<MseLossBackward>)
output :  tensor([[201144.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(10525057., grad_fn=<MseLossBackward>)
output :  tensor([[202560.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1860e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135763.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1528700.3750, grad_fn=<MseLossBackward>)
output :  tensor([[154592.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(166413., grad_fn=<MseLossBackward>)
output :  tensor([[136901.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(813519.4375, grad_fn=<MseLossBackward>)
output :  tensor([[198911.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6647e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156076.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4312371.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139941.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1568e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147148.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5054347., grad_fn=<MseLossBackward>)
output :  tensor([[208159.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(14751721., grad_fn=<MseLossBackward>)
output :  tensor([[104836.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2151e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168812.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1722082.1250, grad_fn=<MseLossBackward>)
output :  tensor([[130116.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4479109.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147091.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8400.8682, grad_fn=<MseLossBackward>)
output :  tensor([[103068.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6553e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141481.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(15853711., grad_fn=<MseLossBackward>)
output :  tensor([[235019.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(962330.3750, grad_fn=<MseLossBackward>)
output :  tensor([[146416.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2006118.1250, grad_fn=<MseLossBackward>)
output :  tensor([[138875.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1890668., grad_fn=<MseLossBackward>)
output :  tensor([[164899.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3616e+09, grad_fn=<MseLossBackward>)
output :  tensor([[267708.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0591e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168771.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(38792460., grad_fn=<MseLossBackward>)
output :  tensor([[104656.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3536045.2500, grad_fn=<MseLossBackward>)
output :  tensor([[200719.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8953e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155083.]], grad_fn=<AddmmBackward>)
loss:  tensor(15342889., grad_fn=<MseLossBackward>)
output :  tensor([[162862.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6037e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97775.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(275100.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123831.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(53530.7773, grad_fn=<MseLossBackward>)
output :  tensor([[158104.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4428986., grad_fn=<MseLossBackward>)
output :  tensor([[140719.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(517005.9375, grad_fn=<MseLossBackward>)
output :  tensor([[202301.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5295751.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145126.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9777445., grad_fn=<MseLossBackward>)
output :  tensor([[265026.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7541717.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130342.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3945e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165247.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(63827.2852, grad_fn=<MseLossBackward>)
output :  tensor([[186045.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6025260.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123700.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8769e+08, grad_fn=<MseLossBackward>)
output :  tensor([[250745.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(555467.4375, grad_fn=<MseLossBackward>)
output :  tensor([[157195.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8833e+08, grad_fn=<MseLossBackward>)
output :  tensor([[242562.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7767978.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141156.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(8086025.5000, grad_fn=<MseLossBackward>)
output :  tensor([[210430.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(184967.1875, grad_fn=<MseLossBackward>)
output :  tensor([[178218.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(33860032., grad_fn=<MseLossBackward>)
output :  tensor([[155291.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1667488., grad_fn=<MseLossBackward>)
output :  tensor([[119428.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2040790.8750, grad_fn=<MseLossBackward>)
output :  tensor([[237520.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4571e+09, grad_fn=<MseLossBackward>)
output :  tensor([[234953.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(25470158., grad_fn=<MseLossBackward>)
output :  tensor([[153583.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(60800.7734, grad_fn=<MseLossBackward>)
output :  tensor([[251912.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(8923009., grad_fn=<MseLossBackward>)
output :  tensor([[122400.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(62357056., grad_fn=<MseLossBackward>)
output :  tensor([[176664.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(441871.7812, grad_fn=<MseLossBackward>)
output :  tensor([[159589.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(168869.6250, grad_fn=<MseLossBackward>)
output :  tensor([[131893.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(798007.2500, grad_fn=<MseLossBackward>)
output :  tensor([[196922.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5459e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165343.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1805076.2500, grad_fn=<MseLossBackward>)
output :  tensor([[163929.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(864493.1875, grad_fn=<MseLossBackward>)
output :  tensor([[156851.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1320129.2500, grad_fn=<MseLossBackward>)
output :  tensor([[151826.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3710258.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172936.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0241e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159935.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4108.0088, grad_fn=<MseLossBackward>)
output :  tensor([[376181.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(60659760., grad_fn=<MseLossBackward>)
output :  tensor([[136601.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(92187904., grad_fn=<MseLossBackward>)
output :  tensor([[130550.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0295e+09, grad_fn=<MseLossBackward>)
output :  tensor([[281786.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(329009.7812, grad_fn=<MseLossBackward>)
output :  tensor([[161409.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(348524.1875, grad_fn=<MseLossBackward>)
output :  tensor([[131550.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2211e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236845.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(23481142., grad_fn=<MseLossBackward>)
output :  tensor([[177554.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(8673761., grad_fn=<MseLossBackward>)
output :  tensor([[156398.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(19345152., grad_fn=<MseLossBackward>)
output :  tensor([[144359.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(410400.3750, grad_fn=<MseLossBackward>)
output :  tensor([[155788.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5677e+08, grad_fn=<MseLossBackward>)
output :  tensor([[101265.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(1601430.8750, grad_fn=<MseLossBackward>)
output :  tensor([[79975.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9902e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163272.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2985768., grad_fn=<MseLossBackward>)
output :  tensor([[187762.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6190e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161265.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(10665429., grad_fn=<MseLossBackward>)
output :  tensor([[155062.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5940416., grad_fn=<MseLossBackward>)
output :  tensor([[141273.]], grad_fn=<AddmmBackward>)
loss:  tensor(14615329., grad_fn=<MseLossBackward>)
output :  tensor([[203867.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4335765., grad_fn=<MseLossBackward>)
output :  tensor([[137895.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(10926.7822, grad_fn=<MseLossBackward>)
output :  tensor([[182418.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6277e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150223.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(17839404., grad_fn=<MseLossBackward>)
output :  tensor([[108495.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5004e+08, grad_fn=<MseLossBackward>)
output :  tensor([[90929.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(9427586., grad_fn=<MseLossBackward>)
output :  tensor([[174881.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(14001.5449, grad_fn=<MseLossBackward>)
output :  tensor([[261192.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(628601.1875, grad_fn=<MseLossBackward>)
output :  tensor([[141656.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(24604.8633, grad_fn=<MseLossBackward>)
output :  tensor([[159048.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(716430., grad_fn=<MseLossBackward>)
output :  tensor([[132511.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(130.1025, grad_fn=<MseLossBackward>)
output :  tensor([[148590.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(827957.8125, grad_fn=<MseLossBackward>)
output :  tensor([[164254.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(13287961., grad_fn=<MseLossBackward>)
output :  tensor([[126470.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(280378.5312, grad_fn=<MseLossBackward>)
output :  tensor([[173840.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3176e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160802.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(14462334., grad_fn=<MseLossBackward>)
output :  tensor([[118078.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2492451.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159530.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3978e+09, grad_fn=<MseLossBackward>)
output :  tensor([[50908.8789]], grad_fn=<AddmmBackward>)
loss:  tensor(1190545.2500, grad_fn=<MseLossBackward>)
output :  tensor([[231961.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4864e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200063.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(877939.7500, grad_fn=<MseLossBackward>)
output :  tensor([[184560.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(192748.4375, grad_fn=<MseLossBackward>)
output :  tensor([[106228.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(52058.8398, grad_fn=<MseLossBackward>)
output :  tensor([[87027.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(775.2744, grad_fn=<MseLossBackward>)
output :  tensor([[132727.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(52888576., grad_fn=<MseLossBackward>)
output :  tensor([[219830.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5011e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201253.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(39018372., grad_fn=<MseLossBackward>)
output :  tensor([[169264.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(18187026., grad_fn=<MseLossBackward>)
output :  tensor([[174430.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2029e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189998.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1174, grad_fn=<MseLossBackward>)
output :  tensor([[85264.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(3010740., grad_fn=<MseLossBackward>)
output :  tensor([[139603.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(157509.7656, grad_fn=<MseLossBackward>)
output :  tensor([[107933.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(6588286., grad_fn=<MseLossBackward>)
output :  tensor([[148761.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6387e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173907.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8411e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191990.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6924e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180377.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(142258.6250, grad_fn=<MseLossBackward>)
output :  tensor([[95822.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(458445.3750, grad_fn=<MseLossBackward>)
output :  tensor([[119172.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2797622., grad_fn=<MseLossBackward>)
output :  tensor([[162086.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8019e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195784.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(17773998., grad_fn=<MseLossBackward>)
output :  tensor([[144257.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(66491.4609, grad_fn=<MseLossBackward>)
train_loss: [2.6308728e+09]
epoch_result tensor([0.])
output :  tensor([[159184.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(468283.5938, grad_fn=<MseLossBackward>)
output :  tensor([[118975.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(9148782., grad_fn=<MseLossBackward>)
output :  tensor([[190998.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(10253104., grad_fn=<MseLossBackward>)
output :  tensor([[177004.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(16.3772, grad_fn=<MseLossBackward>)
output :  tensor([[155292.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1561e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125800.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4839725., grad_fn=<MseLossBackward>)
output :  tensor([[142744.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3043116.7500, grad_fn=<MseLossBackward>)
output :  tensor([[120937.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3753058.7500, grad_fn=<MseLossBackward>)
output :  tensor([[70427.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4227e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167987.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3950591., grad_fn=<MseLossBackward>)
output :  tensor([[138831.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1366451.3750, grad_fn=<MseLossBackward>)
output :  tensor([[224875.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(15550.8691, grad_fn=<MseLossBackward>)
output :  tensor([[166411.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6701950., grad_fn=<MseLossBackward>)
output :  tensor([[244872.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(23304756., grad_fn=<MseLossBackward>)
output :  tensor([[54746.7852]], grad_fn=<AddmmBackward>)
loss:  tensor(64117.7578, grad_fn=<MseLossBackward>)
output :  tensor([[164531.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0124e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179310.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(18577716., grad_fn=<MseLossBackward>)
output :  tensor([[157000.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(250562.8125, grad_fn=<MseLossBackward>)
output :  tensor([[277259.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5103363.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194350.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7018691., grad_fn=<MseLossBackward>)
output :  tensor([[137001.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5900e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194202.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(104733.1406, grad_fn=<MseLossBackward>)
output :  tensor([[177103.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2845e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151631.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(398279.3125, grad_fn=<MseLossBackward>)
output :  tensor([[174707.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(22157468., grad_fn=<MseLossBackward>)
output :  tensor([[87134.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(3008246.2500, grad_fn=<MseLossBackward>)
output :  tensor([[169831.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2298e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186287.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1658903.7500, grad_fn=<MseLossBackward>)
output :  tensor([[205934.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4568e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114303.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(18516548., grad_fn=<MseLossBackward>)
output :  tensor([[171994.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(989651.9375, grad_fn=<MseLossBackward>)
output :  tensor([[138714.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4903526., grad_fn=<MseLossBackward>)
output :  tensor([[127487.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2286616.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120661.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1348247.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146387.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6363e+08, grad_fn=<MseLossBackward>)
output :  tensor([[170968.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0745e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149727.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(781.3772, grad_fn=<MseLossBackward>)
output :  tensor([[182721.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(7406137., grad_fn=<MseLossBackward>)
output :  tensor([[142154.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1333916.7500, grad_fn=<MseLossBackward>)
output :  tensor([[103834.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9140e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136204.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2087e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138897.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(15188801., grad_fn=<MseLossBackward>)
output :  tensor([[128811.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3280513.2500, grad_fn=<MseLossBackward>)
output :  tensor([[223089.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3649413.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134518.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5146730.5000, grad_fn=<MseLossBackward>)
output :  tensor([[149588.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(345872.6250, grad_fn=<MseLossBackward>)
output :  tensor([[115571.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(12753324., grad_fn=<MseLossBackward>)
output :  tensor([[161815.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3294792.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142346.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7724e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192186.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(34706.5273, grad_fn=<MseLossBackward>)
output :  tensor([[135537.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1182384.3750, grad_fn=<MseLossBackward>)
output :  tensor([[98039.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4306e+08, grad_fn=<MseLossBackward>)
output :  tensor([[234705.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(498016.9062, grad_fn=<MseLossBackward>)
output :  tensor([[164982.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3530e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166232.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(52312900., grad_fn=<MseLossBackward>)
output :  tensor([[202798.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8798e+10, grad_fn=<MseLossBackward>)
output :  tensor([[241361.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2687e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143787.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(82782.0781, grad_fn=<MseLossBackward>)
output :  tensor([[138750.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(22564726., grad_fn=<MseLossBackward>)
output :  tensor([[156515.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2296645.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129884.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(13358.3027, grad_fn=<MseLossBackward>)
output :  tensor([[183012.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9270e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181126.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8844490., grad_fn=<MseLossBackward>)
output :  tensor([[157912.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(12870493., grad_fn=<MseLossBackward>)
output :  tensor([[132500.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1023e+08, grad_fn=<MseLossBackward>)
output :  tensor([[143462.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(927308.8125, grad_fn=<MseLossBackward>)
output :  tensor([[141739.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(10629434., grad_fn=<MseLossBackward>)
output :  tensor([[172048.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5749e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193378.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5796e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139732.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(10450774., grad_fn=<MseLossBackward>)
output :  tensor([[169300.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6757238., grad_fn=<MseLossBackward>)
output :  tensor([[176746.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(18092662., grad_fn=<MseLossBackward>)
output :  tensor([[114042.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(916537., grad_fn=<MseLossBackward>)
output :  tensor([[220019.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(961625.3750, grad_fn=<MseLossBackward>)
output :  tensor([[174270.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(85179344., grad_fn=<MseLossBackward>)
output :  tensor([[126638.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1295790.8750, grad_fn=<MseLossBackward>)
output :  tensor([[198212.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2931639.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177528.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6906548.5000, grad_fn=<MseLossBackward>)
output :  tensor([[208802.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1488e+10, grad_fn=<MseLossBackward>)
output :  tensor([[210259.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(548895.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169774.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5034e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191082.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(11677811., grad_fn=<MseLossBackward>)
output :  tensor([[112475.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(274805.3125, grad_fn=<MseLossBackward>)
output :  tensor([[114900.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(5763038., grad_fn=<MseLossBackward>)
output :  tensor([[111742.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(66177.5625, grad_fn=<MseLossBackward>)
output :  tensor([[146739.]], grad_fn=<AddmmBackward>)
loss:  tensor(3721., grad_fn=<MseLossBackward>)
output :  tensor([[159681.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3475e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178584.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2002313.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127171.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(107660.8906, grad_fn=<MseLossBackward>)
output :  tensor([[146662.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2764270., grad_fn=<MseLossBackward>)
output :  tensor([[182916.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3056e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118113.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(1471691.2500, grad_fn=<MseLossBackward>)
output :  tensor([[198585.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2512720.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144747.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(63511.8750, grad_fn=<MseLossBackward>)
output :  tensor([[215372.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6114338., grad_fn=<MseLossBackward>)
output :  tensor([[126904.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(818063.7500, grad_fn=<MseLossBackward>)
output :  tensor([[244671.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(13372620., grad_fn=<MseLossBackward>)
output :  tensor([[239400.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0793e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148192.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8200e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85472.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9889e+08, grad_fn=<MseLossBackward>)
output :  tensor([[191307.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9877e+09, grad_fn=<MseLossBackward>)
output :  tensor([[80406.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(352121.7188, grad_fn=<MseLossBackward>)
output :  tensor([[137445.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4220970., grad_fn=<MseLossBackward>)
output :  tensor([[78869.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(11351214., grad_fn=<MseLossBackward>)
output :  tensor([[142293.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(435002.0938, grad_fn=<MseLossBackward>)
output :  tensor([[173269.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7454777., grad_fn=<MseLossBackward>)
output :  tensor([[152066.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2053936.8750, grad_fn=<MseLossBackward>)
output :  tensor([[109841.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(5959968.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202378.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2853e+10, grad_fn=<MseLossBackward>)
output :  tensor([[129372.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(761651.6250, grad_fn=<MseLossBackward>)
output :  tensor([[266308.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8746e+08, grad_fn=<MseLossBackward>)
output :  tensor([[301111.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(78998208., grad_fn=<MseLossBackward>)
output :  tensor([[110339.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(8063780.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170547.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3810609., grad_fn=<MseLossBackward>)
output :  tensor([[134017.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7689e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139676.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(458096.3125, grad_fn=<MseLossBackward>)
output :  tensor([[131058.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(653583.8125, grad_fn=<MseLossBackward>)
output :  tensor([[121684.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(10992851., grad_fn=<MseLossBackward>)
output :  tensor([[134677.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3389e+08, grad_fn=<MseLossBackward>)
output :  tensor([[228095.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7988e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187054.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3699e+10, grad_fn=<MseLossBackward>)
output :  tensor([[140704.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(10210521., grad_fn=<MseLossBackward>)
output :  tensor([[127957.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(209535.0625, grad_fn=<MseLossBackward>)
output :  tensor([[112866.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(2614209., grad_fn=<MseLossBackward>)
output :  tensor([[254243.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0727e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134070.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(863883.1250, grad_fn=<MseLossBackward>)
output :  tensor([[203519.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(269734.1562, grad_fn=<MseLossBackward>)
output :  tensor([[105850.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(903940.4375, grad_fn=<MseLossBackward>)
output :  tensor([[139578.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(138000.6406, grad_fn=<MseLossBackward>)
output :  tensor([[207240.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9789e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178951.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(898852.1250, grad_fn=<MseLossBackward>)
output :  tensor([[187784.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7751700., grad_fn=<MseLossBackward>)
output :  tensor([[162468.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1471e+10, grad_fn=<MseLossBackward>)
output :  tensor([[291824.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8641e+09, grad_fn=<MseLossBackward>)
output :  tensor([[198109.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(44067.1953, grad_fn=<MseLossBackward>)
output :  tensor([[262813.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9613e+10, grad_fn=<MseLossBackward>)
output :  tensor([[219234.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1870e+09, grad_fn=<MseLossBackward>)
output :  tensor([[277354.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5718e+09, grad_fn=<MseLossBackward>)
output :  tensor([[225966.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3865831.7500, grad_fn=<MseLossBackward>)
output :  tensor([[222201.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8831e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188591.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(70707600., grad_fn=<MseLossBackward>)
output :  tensor([[159539.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3263e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132330.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(28788.5449, grad_fn=<MseLossBackward>)
output :  tensor([[136022.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(272989.9375, grad_fn=<MseLossBackward>)
output :  tensor([[89764.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(1527560.8750, grad_fn=<MseLossBackward>)
output :  tensor([[108519.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(269596.2188, grad_fn=<MseLossBackward>)
output :  tensor([[272916.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1342e+09, grad_fn=<MseLossBackward>)
output :  tensor([[232190.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7895046.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146047.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1096667.1250, grad_fn=<MseLossBackward>)
output :  tensor([[134712.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7768501.5000, grad_fn=<MseLossBackward>)
output :  tensor([[173763.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(954.2307, grad_fn=<MseLossBackward>)
output :  tensor([[148415.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(10019104., grad_fn=<MseLossBackward>)
output :  tensor([[165797.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2386e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168567.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(12729621., grad_fn=<MseLossBackward>)
output :  tensor([[137786.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(618631.4375, grad_fn=<MseLossBackward>)
output :  tensor([[190279.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5940e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114816.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(7933816.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172832.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(692484., grad_fn=<MseLossBackward>)
output :  tensor([[119641.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(128673.5391, grad_fn=<MseLossBackward>)
output :  tensor([[88366.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1866126.7500, grad_fn=<MseLossBackward>)
output :  tensor([[179364.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(404178.0625, grad_fn=<MseLossBackward>)
output :  tensor([[110760.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(739855.3125, grad_fn=<MseLossBackward>)
output :  tensor([[238492.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(257603.8281, grad_fn=<MseLossBackward>)
output :  tensor([[248316.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(10999898., grad_fn=<MseLossBackward>)
output :  tensor([[133262.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(14156406., grad_fn=<MseLossBackward>)
output :  tensor([[108337.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(386417.6250, grad_fn=<MseLossBackward>)
output :  tensor([[291521.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1209e+10, grad_fn=<MseLossBackward>)
output :  tensor([[176092.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(21092204., grad_fn=<MseLossBackward>)
output :  tensor([[124731.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(72289.5625, grad_fn=<MseLossBackward>)
output :  tensor([[146262.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9876e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199124.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2128e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137647.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(11237790., grad_fn=<MseLossBackward>)
output :  tensor([[159424.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4538e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153177.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(522074., grad_fn=<MseLossBackward>)
output :  tensor([[130358.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(737867.5625, grad_fn=<MseLossBackward>)
output :  tensor([[245355.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7728e+10, grad_fn=<MseLossBackward>)
output :  tensor([[396479.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(30478680., grad_fn=<MseLossBackward>)
output :  tensor([[104037.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(24623150., grad_fn=<MseLossBackward>)
output :  tensor([[120367.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3486272.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158725.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(600164.9375, grad_fn=<MseLossBackward>)
output :  tensor([[132553.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5996e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162910.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4916e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173152.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9882e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106544.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(8669482., grad_fn=<MseLossBackward>)
output :  tensor([[139891.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1228114.1250, grad_fn=<MseLossBackward>)
output :  tensor([[362490.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(23071810., grad_fn=<MseLossBackward>)
output :  tensor([[203688.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5312e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173572.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3714714.2500, grad_fn=<MseLossBackward>)
output :  tensor([[207145.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(18021484., grad_fn=<MseLossBackward>)
output :  tensor([[138555.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(197941.5781, grad_fn=<MseLossBackward>)
output :  tensor([[193989.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(260402.9062, grad_fn=<MseLossBackward>)
output :  tensor([[137555.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0331e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176678.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(18679278., grad_fn=<MseLossBackward>)
output :  tensor([[239265.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(7477575.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169976.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(16188301., grad_fn=<MseLossBackward>)
output :  tensor([[108659.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(435301., grad_fn=<MseLossBackward>)
output :  tensor([[267922.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(11302624., grad_fn=<MseLossBackward>)
output :  tensor([[244546.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(29741514., grad_fn=<MseLossBackward>)
output :  tensor([[121282.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(2949994., grad_fn=<MseLossBackward>)
output :  tensor([[216444.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4287e+09, grad_fn=<MseLossBackward>)
output :  tensor([[303747.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6453e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207789.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(623803.8125, grad_fn=<MseLossBackward>)
output :  tensor([[213634.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5968e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158813.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(834510.8125, grad_fn=<MseLossBackward>)
output :  tensor([[166842.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9905379., grad_fn=<MseLossBackward>)
output :  tensor([[163006.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(36898412., grad_fn=<MseLossBackward>)
output :  tensor([[173472.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(12059124., grad_fn=<MseLossBackward>)
output :  tensor([[232576.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2548e+09, grad_fn=<MseLossBackward>)
output :  tensor([[214843.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1353e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162036.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2610e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122562.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(191556.6719, grad_fn=<MseLossBackward>)
output :  tensor([[176913.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7558.1289, grad_fn=<MseLossBackward>)
output :  tensor([[182142.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0618e+09, grad_fn=<MseLossBackward>)
output :  tensor([[208110.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4784e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134763.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(109840.4609, grad_fn=<MseLossBackward>)
output :  tensor([[150285.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2284e+08, grad_fn=<MseLossBackward>)
output :  tensor([[275633.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1867493.1250, grad_fn=<MseLossBackward>)
output :  tensor([[86138.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(1295453., grad_fn=<MseLossBackward>)
output :  tensor([[235547.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(906542., grad_fn=<MseLossBackward>)
output :  tensor([[258808.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0506e+11, grad_fn=<MseLossBackward>)
output :  tensor([[170082.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6837.2227, grad_fn=<MseLossBackward>)
output :  tensor([[192569.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8004e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153908.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1190690.1250, grad_fn=<MseLossBackward>)
output :  tensor([[205813.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1199e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130845.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3407312.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145983.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(967579.6250, grad_fn=<MseLossBackward>)
output :  tensor([[169058.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0534e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187902.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4214745., grad_fn=<MseLossBackward>)
output :  tensor([[129136.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(9834741., grad_fn=<MseLossBackward>)
output :  tensor([[137198.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(488142.3750, grad_fn=<MseLossBackward>)
output :  tensor([[178388.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(29037616., grad_fn=<MseLossBackward>)
output :  tensor([[198463.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6560e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239140.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(14894293., grad_fn=<MseLossBackward>)
output :  tensor([[152899.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4412691., grad_fn=<MseLossBackward>)
output :  tensor([[195004.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(990460.3750, grad_fn=<MseLossBackward>)
output :  tensor([[166525.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0742e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188766.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(85865416., grad_fn=<MseLossBackward>)
output :  tensor([[178571.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1766199.5000, grad_fn=<MseLossBackward>)
output :  tensor([[98472.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2167336., grad_fn=<MseLossBackward>)
output :  tensor([[172144.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1633e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133484.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2298066.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121576.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(43247576., grad_fn=<MseLossBackward>)
output :  tensor([[174903.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(815578.3125, grad_fn=<MseLossBackward>)
output :  tensor([[87397.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5746133.5000, grad_fn=<MseLossBackward>)
output :  tensor([[287480.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6348982.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167927.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(8567603., grad_fn=<MseLossBackward>)
output :  tensor([[188547.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0915e+10, grad_fn=<MseLossBackward>)
output :  tensor([[246466.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0188e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151004.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(16.8870, grad_fn=<MseLossBackward>)
output :  tensor([[123988.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(141.7588, grad_fn=<MseLossBackward>)
output :  tensor([[118758.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1303521.7500, grad_fn=<MseLossBackward>)
output :  tensor([[144510.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7086e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175981.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3928076.2500, grad_fn=<MseLossBackward>)
output :  tensor([[109226.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1432e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207628.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2182e+10, grad_fn=<MseLossBackward>)
output :  tensor([[241636.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(18751.8789, grad_fn=<MseLossBackward>)
output :  tensor([[249645.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1184e+10, grad_fn=<MseLossBackward>)
output :  tensor([[220156.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5509e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194630.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4610e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188251.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(564940.1250, grad_fn=<MseLossBackward>)
output :  tensor([[205525.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8112e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187749.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1978e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177834.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(820722.7500, grad_fn=<MseLossBackward>)
output :  tensor([[151709.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(84363.0156, grad_fn=<MseLossBackward>)
output :  tensor([[340728.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(13904975., grad_fn=<MseLossBackward>)
output :  tensor([[215061.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(9375366., grad_fn=<MseLossBackward>)
output :  tensor([[159347.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(426102.9688, grad_fn=<MseLossBackward>)
output :  tensor([[186911.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9799e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103805.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(1426139.7500, grad_fn=<MseLossBackward>)
output :  tensor([[271684.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0267e+10, grad_fn=<MseLossBackward>)
output :  tensor([[169642.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(18125374., grad_fn=<MseLossBackward>)
output :  tensor([[218560.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(25608818., grad_fn=<MseLossBackward>)
output :  tensor([[209432.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3382e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180176.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(954498.5000, grad_fn=<MseLossBackward>)
output :  tensor([[207457.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(32007836., grad_fn=<MseLossBackward>)
output :  tensor([[157596.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6743760., grad_fn=<MseLossBackward>)
output :  tensor([[150095.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5095e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119542.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(1085943.1250, grad_fn=<MseLossBackward>)
output :  tensor([[139429.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(325060.3438, grad_fn=<MseLossBackward>)
output :  tensor([[148169.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(690197.5000, grad_fn=<MseLossBackward>)
output :  tensor([[201689.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5954e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160670.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1370362.8750, grad_fn=<MseLossBackward>)
output :  tensor([[99929.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(184537.3594, grad_fn=<MseLossBackward>)
output :  tensor([[225217.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1851e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186658.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4767e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176838.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(125061.6953, grad_fn=<MseLossBackward>)
output :  tensor([[82753.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(567515.0625, grad_fn=<MseLossBackward>)
output :  tensor([[130849.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(5521068., grad_fn=<MseLossBackward>)
output :  tensor([[215535.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2357040.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142820.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1391699.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131346.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1813356.7500, grad_fn=<MseLossBackward>)
output :  tensor([[144490.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3572749.7500, grad_fn=<MseLossBackward>)
output :  tensor([[177816.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6254e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146688.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7227024., grad_fn=<MseLossBackward>)
output :  tensor([[159858.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(19929.4980, grad_fn=<MseLossBackward>)
output :  tensor([[214973.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(690.7041, grad_fn=<MseLossBackward>)
output :  tensor([[136755.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0084e+09, grad_fn=<MseLossBackward>)
output :  tensor([[257597.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(6749117., grad_fn=<MseLossBackward>)
output :  tensor([[157972.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2333733.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128870.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(137623.6094, grad_fn=<MseLossBackward>)
output :  tensor([[98036.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(9222989., grad_fn=<MseLossBackward>)
output :  tensor([[153982.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8278e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178239.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2758298.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123903.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(11586631., grad_fn=<MseLossBackward>)
output :  tensor([[186103.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8358e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145284.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3275e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151971.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4291177., grad_fn=<MseLossBackward>)
output :  tensor([[187539.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(44205.0625, grad_fn=<MseLossBackward>)
output :  tensor([[249766.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8758e+09, grad_fn=<MseLossBackward>)
output :  tensor([[90938.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(315484.0625, grad_fn=<MseLossBackward>)
output :  tensor([[236298.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(13702837., grad_fn=<MseLossBackward>)
output :  tensor([[126923.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(2484096.2500, grad_fn=<MseLossBackward>)
output :  tensor([[165934.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9932e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113854.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9194e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177588.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2522339.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164703.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4026e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155538.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2692e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239434.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(188898.8906, grad_fn=<MseLossBackward>)
output :  tensor([[225573.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0515e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124111.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(8345508.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124644.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(1838460.6250, grad_fn=<MseLossBackward>)
output :  tensor([[226191.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(653849.1250, grad_fn=<MseLossBackward>)
output :  tensor([[230480.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(12384571., grad_fn=<MseLossBackward>)
output :  tensor([[225127.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2473002., grad_fn=<MseLossBackward>)
output :  tensor([[146963.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1075239.3750, grad_fn=<MseLossBackward>)
output :  tensor([[212503.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6268764., grad_fn=<MseLossBackward>)
output :  tensor([[131231.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2616e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135692.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(10194850., grad_fn=<MseLossBackward>)
output :  tensor([[308516.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(42035368., grad_fn=<MseLossBackward>)
output :  tensor([[138155.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8091536., grad_fn=<MseLossBackward>)
output :  tensor([[119034.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7076e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109105.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(155630.2500, grad_fn=<MseLossBackward>)
output :  tensor([[154504.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2384e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179970.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9785e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166013.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(48809000., grad_fn=<MseLossBackward>)
output :  tensor([[191689.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(86679304., grad_fn=<MseLossBackward>)
output :  tensor([[104647.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(21602234., grad_fn=<MseLossBackward>)
output :  tensor([[177599.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1960087.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167935.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1250.2854, grad_fn=<MseLossBackward>)
output :  tensor([[136168.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8018454., grad_fn=<MseLossBackward>)
output :  tensor([[260330.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7555e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141426.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1839e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175256.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5090241., grad_fn=<MseLossBackward>)
output :  tensor([[142739.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7503234., grad_fn=<MseLossBackward>)
output :  tensor([[201139.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(409200.0938, grad_fn=<MseLossBackward>)
output :  tensor([[169257.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(551027.8750, grad_fn=<MseLossBackward>)
output :  tensor([[241573.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5888054., grad_fn=<MseLossBackward>)
output :  tensor([[133375.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1264184., grad_fn=<MseLossBackward>)
output :  tensor([[152097.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7549185.5000, grad_fn=<MseLossBackward>)
output :  tensor([[210857.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(17156552., grad_fn=<MseLossBackward>)
output :  tensor([[163694.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1704452.6250, grad_fn=<MseLossBackward>)
output :  tensor([[190067.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1138822.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133993.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2533e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131410.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5810133.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136423.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(12794258., grad_fn=<MseLossBackward>)
output :  tensor([[199806.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8572e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165412.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5414e+09, grad_fn=<MseLossBackward>)
output :  tensor([[77011.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8939e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94634.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0270e+08, grad_fn=<MseLossBackward>)
output :  tensor([[252627.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(443451.9375, grad_fn=<MseLossBackward>)
output :  tensor([[202259.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0018e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115205.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(42101.9102, grad_fn=<MseLossBackward>)
output :  tensor([[155425.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0287e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205318.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1555e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179133.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2567e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156021.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1044036.9375, grad_fn=<MseLossBackward>)
output :  tensor([[167467.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6411103., grad_fn=<MseLossBackward>)
output :  tensor([[112297.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(7306082.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163468.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(71708080., grad_fn=<MseLossBackward>)
output :  tensor([[194068.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6465e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219901.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(161490.9531, grad_fn=<MseLossBackward>)
output :  tensor([[245748.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4925e+11, grad_fn=<MseLossBackward>)
output :  tensor([[153989.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(48849616., grad_fn=<MseLossBackward>)
output :  tensor([[106336.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(4594224., grad_fn=<MseLossBackward>)
output :  tensor([[170282.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3497e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150321.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(31945.9766, grad_fn=<MseLossBackward>)
output :  tensor([[236937.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3869.2288, grad_fn=<MseLossBackward>)
output :  tensor([[113942.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(1119248.2500, grad_fn=<MseLossBackward>)
output :  tensor([[178659.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(17978262., grad_fn=<MseLossBackward>)
output :  tensor([[187925.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1500969.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163566.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4471e+10, grad_fn=<MseLossBackward>)
output :  tensor([[96450.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3871e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236607.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5723757., grad_fn=<MseLossBackward>)
output :  tensor([[176189.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(35880.6484, grad_fn=<MseLossBackward>)
output :  tensor([[140902.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(815324.3750, grad_fn=<MseLossBackward>)
output :  tensor([[239139.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(17132874., grad_fn=<MseLossBackward>)
output :  tensor([[165048.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4194368., grad_fn=<MseLossBackward>)
output :  tensor([[200432.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5517e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135296.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(87977.1250, grad_fn=<MseLossBackward>)
output :  tensor([[185367.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4604e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135303.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(484437.7500, grad_fn=<MseLossBackward>)
output :  tensor([[227325.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(75248304., grad_fn=<MseLossBackward>)
output :  tensor([[222700.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4526e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91290.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(1665652.3750, grad_fn=<MseLossBackward>)
output :  tensor([[157450.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3932846.7500, grad_fn=<MseLossBackward>)
output :  tensor([[246906.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5369e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145594.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(352984.5000, grad_fn=<MseLossBackward>)
output :  tensor([[112736.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0919e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162436.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4256678., grad_fn=<MseLossBackward>)
output :  tensor([[144869.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(756084.6250, grad_fn=<MseLossBackward>)
output :  tensor([[127913.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(82207.6406, grad_fn=<MseLossBackward>)
output :  tensor([[190065.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7519e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123157.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(432696.7188, grad_fn=<MseLossBackward>)
output :  tensor([[152336.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(113442.6562, grad_fn=<MseLossBackward>)
output :  tensor([[169324.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5881762., grad_fn=<MseLossBackward>)
output :  tensor([[150860.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(19412.3262, grad_fn=<MseLossBackward>)
output :  tensor([[154217.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(75393136., grad_fn=<MseLossBackward>)
output :  tensor([[135871.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2208e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132613.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(376133.0625, grad_fn=<MseLossBackward>)
output :  tensor([[153461.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0913e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146623.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6106613., grad_fn=<MseLossBackward>)
output :  tensor([[161442.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(94268.1875, grad_fn=<MseLossBackward>)
output :  tensor([[141301.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8604e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146436.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5588053., grad_fn=<MseLossBackward>)
output :  tensor([[185859.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4580001.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167653.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1814324.8750, grad_fn=<MseLossBackward>)
output :  tensor([[178976.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1046816.7500, grad_fn=<MseLossBackward>)
output :  tensor([[219059.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(884128.8125, grad_fn=<MseLossBackward>)
output :  tensor([[110111.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(4889454., grad_fn=<MseLossBackward>)
output :  tensor([[139551.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1465e+08, grad_fn=<MseLossBackward>)
output :  tensor([[281438.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(20805856., grad_fn=<MseLossBackward>)
output :  tensor([[117522.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2317958.7500, grad_fn=<MseLossBackward>)
output :  tensor([[176633.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8806e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180920.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(16643340., grad_fn=<MseLossBackward>)
output :  tensor([[191789.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(39552308., grad_fn=<MseLossBackward>)
output :  tensor([[250413.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0448e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222526.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(277152.9062, grad_fn=<MseLossBackward>)
output :  tensor([[129140.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4011e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177236.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8741e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123841.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(25241.2656, grad_fn=<MseLossBackward>)
output :  tensor([[184664.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4575e+10, grad_fn=<MseLossBackward>)
output :  tensor([[154129.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1275099.7500, grad_fn=<MseLossBackward>)
output :  tensor([[156374.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(97503280., grad_fn=<MseLossBackward>)
output :  tensor([[202079.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(17814862., grad_fn=<MseLossBackward>)
output :  tensor([[145265.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6295e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174569.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2047582.1250, grad_fn=<MseLossBackward>)
output :  tensor([[251665.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7477e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149513.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2289831., grad_fn=<MseLossBackward>)
output :  tensor([[201394.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1614130.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163524.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(12774370., grad_fn=<MseLossBackward>)
output :  tensor([[126588.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4890e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138069.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(5378558., grad_fn=<MseLossBackward>)
output :  tensor([[179858.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(17149952., grad_fn=<MseLossBackward>)
output :  tensor([[193997.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(15982505., grad_fn=<MseLossBackward>)
output :  tensor([[229154.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5815e+09, grad_fn=<MseLossBackward>)
output :  tensor([[255213.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3190968.2500, grad_fn=<MseLossBackward>)
output :  tensor([[183815.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8275e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145290.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8934e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151054.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(42955324., grad_fn=<MseLossBackward>)
output :  tensor([[76189.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3097e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144549.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(91187880., grad_fn=<MseLossBackward>)
output :  tensor([[130795.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3593453.5000, grad_fn=<MseLossBackward>)
output :  tensor([[156399.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5758875., grad_fn=<MseLossBackward>)
output :  tensor([[124571.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(5898219.5000, grad_fn=<MseLossBackward>)
output :  tensor([[79299.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7838512.5000, grad_fn=<MseLossBackward>)
output :  tensor([[83791.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3210592., grad_fn=<MseLossBackward>)
output :  tensor([[236969.]], grad_fn=<AddmmBackward>)
loss:  tensor(24690960., grad_fn=<MseLossBackward>)
output :  tensor([[143436.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5704e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134293.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(14390405., grad_fn=<MseLossBackward>)
output :  tensor([[165612.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1925589.8750, grad_fn=<MseLossBackward>)
output :  tensor([[236177.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1386248.6250, grad_fn=<MseLossBackward>)
output :  tensor([[192669.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(279956.7188, grad_fn=<MseLossBackward>)
output :  tensor([[154095.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3627001.2500, grad_fn=<MseLossBackward>)
output :  tensor([[198971.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1148045.2500, grad_fn=<MseLossBackward>)
output :  tensor([[200646.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3216e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137832.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(692250., grad_fn=<MseLossBackward>)
output :  tensor([[156529.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2339657., grad_fn=<MseLossBackward>)
output :  tensor([[135478.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(272157.8438, grad_fn=<MseLossBackward>)
output :  tensor([[197932.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0283e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155736.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3014998.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139636.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1286e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146218.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1737618.2500, grad_fn=<MseLossBackward>)
output :  tensor([[212373.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(139350.5625, grad_fn=<MseLossBackward>)
output :  tensor([[104779.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1891e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167867.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(134826.6562, grad_fn=<MseLossBackward>)
output :  tensor([[126842.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1340149.8750, grad_fn=<MseLossBackward>)
output :  tensor([[146513.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(236743.0625, grad_fn=<MseLossBackward>)
output :  tensor([[104101.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7405e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138539.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1081015.1250, grad_fn=<MseLossBackward>)
output :  tensor([[240431.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(19642486., grad_fn=<MseLossBackward>)
output :  tensor([[144124.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(765871.1250, grad_fn=<MseLossBackward>)
output :  tensor([[137756.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(66024.9062, grad_fn=<MseLossBackward>)
output :  tensor([[164971.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3669e+09, grad_fn=<MseLossBackward>)
output :  tensor([[265246.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6265e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173638.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1854490.7500, grad_fn=<MseLossBackward>)
output :  tensor([[105821.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9277450., grad_fn=<MseLossBackward>)
output :  tensor([[201654.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7525e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161292.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5256702.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161969.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6422e+10, grad_fn=<MseLossBackward>)
output :  tensor([[99511.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1467770.1250, grad_fn=<MseLossBackward>)
output :  tensor([[121334.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(5130260.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157293.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1674233.8750, grad_fn=<MseLossBackward>)
output :  tensor([[139540.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(211039.7500, grad_fn=<MseLossBackward>)
output :  tensor([[199897.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(10586.4805, grad_fn=<MseLossBackward>)
output :  tensor([[143969.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3878868.7500, grad_fn=<MseLossBackward>)
output :  tensor([[259513.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(7654041., grad_fn=<MseLossBackward>)
output :  tensor([[128569.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2652e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164493.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1012381.8125, grad_fn=<MseLossBackward>)
output :  tensor([[189269.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(591553.2500, grad_fn=<MseLossBackward>)
output :  tensor([[122623.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5934e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244229.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(33301736., grad_fn=<MseLossBackward>)
output :  tensor([[158935.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8762e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243561.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3198117.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142701.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1686751.5000, grad_fn=<MseLossBackward>)
output :  tensor([[211030.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1061479.5000, grad_fn=<MseLossBackward>)
output :  tensor([[173032.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(400214.3750, grad_fn=<MseLossBackward>)
output :  tensor([[151538.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6058751.5000, grad_fn=<MseLossBackward>)
output :  tensor([[119457.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(2124283.5000, grad_fn=<MseLossBackward>)
output :  tensor([[235412.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6706e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239853.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(21489.7266, grad_fn=<MseLossBackward>)
output :  tensor([[152887.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(202317.2344, grad_fn=<MseLossBackward>)
output :  tensor([[253767.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1281848.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122046.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(56885416., grad_fn=<MseLossBackward>)
output :  tensor([[178343.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5492724.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163390.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(11492524., grad_fn=<MseLossBackward>)
output :  tensor([[130342.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(432522.0312, grad_fn=<MseLossBackward>)
output :  tensor([[195282.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3273e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166259.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5106258., grad_fn=<MseLossBackward>)
output :  tensor([[161799.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1440825.1250, grad_fn=<MseLossBackward>)
output :  tensor([[158715.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(511493.1562, grad_fn=<MseLossBackward>)
output :  tensor([[147519.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5668194., grad_fn=<MseLossBackward>)
output :  tensor([[172749.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0005e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164226.]], grad_fn=<AddmmBackward>)
loss:  tensor(17859076., grad_fn=<MseLossBackward>)
output :  tensor([[376135.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(61380860., grad_fn=<MseLossBackward>)
output :  tensor([[126507.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(243025.8906, grad_fn=<MseLossBackward>)
output :  tensor([[129884.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9700e+09, grad_fn=<MseLossBackward>)
output :  tensor([[280430.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(612501.8750, grad_fn=<MseLossBackward>)
output :  tensor([[163822.]], grad_fn=<AddmmBackward>)
loss:  tensor(3319684., grad_fn=<MseLossBackward>)
output :  tensor([[133494.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6885e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226823.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(26800358., grad_fn=<MseLossBackward>)
output :  tensor([[182154.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2738973.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153136.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1291632.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145061.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3770.7275, grad_fn=<MseLossBackward>)
output :  tensor([[156835.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9741e+08, grad_fn=<MseLossBackward>)
output :  tensor([[102075.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(4307732.5000, grad_fn=<MseLossBackward>)
output :  tensor([[78125.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2854e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166047.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1098074.7500, grad_fn=<MseLossBackward>)
output :  tensor([[188622.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5505e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160003.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4014200., grad_fn=<MseLossBackward>)
output :  tensor([[158005.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(255182.8438, grad_fn=<MseLossBackward>)
output :  tensor([[136340.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1230158.2500, grad_fn=<MseLossBackward>)
output :  tensor([[205663.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(82073.2969, grad_fn=<MseLossBackward>)
output :  tensor([[140585.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6683275., grad_fn=<MseLossBackward>)
output :  tensor([[182347.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6295e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150890.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(23918978., grad_fn=<MseLossBackward>)
output :  tensor([[111842.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3191e+08, grad_fn=<MseLossBackward>)
output :  tensor([[95222.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1495002.8750, grad_fn=<MseLossBackward>)
output :  tensor([[176170.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1369594.7500, grad_fn=<MseLossBackward>)
output :  tensor([[255953.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(19768862., grad_fn=<MseLossBackward>)
output :  tensor([[144908.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(11617553., grad_fn=<MseLossBackward>)
output :  tensor([[159773.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(14823.0625, grad_fn=<MseLossBackward>)
output :  tensor([[131042.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2123850.7500, grad_fn=<MseLossBackward>)
output :  tensor([[150543.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1089185.7500, grad_fn=<MseLossBackward>)
output :  tensor([[172052.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(17242866., grad_fn=<MseLossBackward>)
output :  tensor([[131058.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(16475100., grad_fn=<MseLossBackward>)
output :  tensor([[174274.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5698e+08, grad_fn=<MseLossBackward>)
output :  tensor([[159890.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(8357248.5000, grad_fn=<MseLossBackward>)
output :  tensor([[116457.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1798.2900, grad_fn=<MseLossBackward>)
output :  tensor([[162460.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9758e+09, grad_fn=<MseLossBackward>)
output :  tensor([[53474.8008]], grad_fn=<AddmmBackward>)
loss:  tensor(2175037.2500, grad_fn=<MseLossBackward>)
output :  tensor([[231441.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5705e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201281.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(79136.7188, grad_fn=<MseLossBackward>)
output :  tensor([[186088.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1185546.6250, grad_fn=<MseLossBackward>)
output :  tensor([[104299.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(2893215., grad_fn=<MseLossBackward>)
output :  tensor([[89689.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(7234713., grad_fn=<MseLossBackward>)
output :  tensor([[142285.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5224367.5000, grad_fn=<MseLossBackward>)
output :  tensor([[218669.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6747e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201501.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(35983500., grad_fn=<MseLossBackward>)
output :  tensor([[166496.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2238764., grad_fn=<MseLossBackward>)
output :  tensor([[172571.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5430e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190128.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(16612.7930, grad_fn=<MseLossBackward>)
output :  tensor([[90539.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(12525074., grad_fn=<MseLossBackward>)
output :  tensor([[140015.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(242.1914, grad_fn=<MseLossBackward>)
output :  tensor([[113500.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(9003047., grad_fn=<MseLossBackward>)
output :  tensor([[146704.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1545e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173730.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8259e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193362.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3542e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178370.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2654913.7500, grad_fn=<MseLossBackward>)
output :  tensor([[97478.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(957294.0625, grad_fn=<MseLossBackward>)
output :  tensor([[119144.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(2703994.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161688.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9782e+08, grad_fn=<MseLossBackward>)
output :  tensor([[201020.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1040431.8750, grad_fn=<MseLossBackward>)
output :  tensor([[140778.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(10375445., grad_fn=<MseLossBackward>)
train_loss: [2.6248814e+09]
epoch_result tensor([0.])
output :  tensor([[157219.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1640440.6250, grad_fn=<MseLossBackward>)
output :  tensor([[121479.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(270822.6562, grad_fn=<MseLossBackward>)
output :  tensor([[199731.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(30591788., grad_fn=<MseLossBackward>)
output :  tensor([[175736.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1596590.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155425.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0961e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129399.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(1958622.1250, grad_fn=<MseLossBackward>)
output :  tensor([[142420.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2017332., grad_fn=<MseLossBackward>)
output :  tensor([[118644.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(126419.1328, grad_fn=<MseLossBackward>)
output :  tensor([[70493.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4385e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166506.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(256573.9062, grad_fn=<MseLossBackward>)
output :  tensor([[149014.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(81258112., grad_fn=<MseLossBackward>)
output :  tensor([[226569.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2461908., grad_fn=<MseLossBackward>)
output :  tensor([[167146.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3436910.5000, grad_fn=<MseLossBackward>)
output :  tensor([[246924.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7700798.5000, grad_fn=<MseLossBackward>)
output :  tensor([[56041.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(1085519.7500, grad_fn=<MseLossBackward>)
output :  tensor([[163741.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7025e+08, grad_fn=<MseLossBackward>)
output :  tensor([[170631.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(19083246., grad_fn=<MseLossBackward>)
output :  tensor([[154542.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3830460.5000, grad_fn=<MseLossBackward>)
output :  tensor([[276531.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2344918., grad_fn=<MseLossBackward>)
output :  tensor([[192860.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(17136496., grad_fn=<MseLossBackward>)
output :  tensor([[137703.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5513e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193705.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(30015.5625, grad_fn=<MseLossBackward>)
output :  tensor([[177453.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2512e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150454.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(297962.4688, grad_fn=<MseLossBackward>)
output :  tensor([[169215.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(615808.0625, grad_fn=<MseLossBackward>)
output :  tensor([[85776.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(141840.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168932.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1284e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182991.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4033256.2500, grad_fn=<MseLossBackward>)
output :  tensor([[204123.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6396e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109987.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(162.1643, grad_fn=<MseLossBackward>)
output :  tensor([[170288.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(505787.6562, grad_fn=<MseLossBackward>)
output :  tensor([[137821.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1746155.7500, grad_fn=<MseLossBackward>)
output :  tensor([[129755.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(570685.8125, grad_fn=<MseLossBackward>)
output :  tensor([[118631.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(754631.5625, grad_fn=<MseLossBackward>)
output :  tensor([[146668.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8023e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168571.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1441e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151337.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2679922.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180183.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(33649.3164, grad_fn=<MseLossBackward>)
output :  tensor([[141776.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(603025.0625, grad_fn=<MseLossBackward>)
output :  tensor([[110288.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1161e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136354.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1852e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137802.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(7852167., grad_fn=<MseLossBackward>)
output :  tensor([[131813.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(23172190., grad_fn=<MseLossBackward>)
output :  tensor([[225572.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(327273.3750, grad_fn=<MseLossBackward>)
output :  tensor([[133125.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(765789.0625, grad_fn=<MseLossBackward>)
output :  tensor([[146178.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7960157., grad_fn=<MseLossBackward>)
output :  tensor([[112452.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(204975.4844, grad_fn=<MseLossBackward>)
output :  tensor([[158325.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2803427., grad_fn=<MseLossBackward>)
output :  tensor([[148472.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1648e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193033.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1068413., grad_fn=<MseLossBackward>)
output :  tensor([[135879.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2043336.2500, grad_fn=<MseLossBackward>)
output :  tensor([[107719.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(5200929.5000, grad_fn=<MseLossBackward>)
output :  tensor([[231353.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(7002887., grad_fn=<MseLossBackward>)
output :  tensor([[164514.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3986e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158732.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(71364.1172, grad_fn=<MseLossBackward>)
output :  tensor([[204809.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8120e+10, grad_fn=<MseLossBackward>)
output :  tensor([[245348.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1805e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141302.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4830105., grad_fn=<MseLossBackward>)
output :  tensor([[137732.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(13930040., grad_fn=<MseLossBackward>)
output :  tensor([[154516.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(233409.7656, grad_fn=<MseLossBackward>)
output :  tensor([[133806.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(14491940., grad_fn=<MseLossBackward>)
output :  tensor([[180370.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3408e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184783.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(467791.8750, grad_fn=<MseLossBackward>)
output :  tensor([[162285.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(617157.5625, grad_fn=<MseLossBackward>)
output :  tensor([[139722.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(10740470., grad_fn=<MseLossBackward>)
output :  tensor([[143773.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1622478.8750, grad_fn=<MseLossBackward>)
output :  tensor([[147230.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4972969.5000, grad_fn=<MseLossBackward>)
output :  tensor([[173667.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3585e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192334.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0841e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138516.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4066020.2500, grad_fn=<MseLossBackward>)
output :  tensor([[174164.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5129022., grad_fn=<MseLossBackward>)
output :  tensor([[177403.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(12931328., grad_fn=<MseLossBackward>)
output :  tensor([[115221.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(49103.7891, grad_fn=<MseLossBackward>)
output :  tensor([[224468.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(12030601., grad_fn=<MseLossBackward>)
output :  tensor([[183761.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(68423.1172, grad_fn=<MseLossBackward>)
output :  tensor([[125908.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(166623.4062, grad_fn=<MseLossBackward>)
output :  tensor([[197405.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(819562.4375, grad_fn=<MseLossBackward>)
output :  tensor([[175316.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(173719.6406, grad_fn=<MseLossBackward>)
output :  tensor([[205790.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2566e+10, grad_fn=<MseLossBackward>)
output :  tensor([[212527.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2332063., grad_fn=<MseLossBackward>)
output :  tensor([[166829.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2838e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189315.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(26874180., grad_fn=<MseLossBackward>)
output :  tensor([[115015.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(4061579., grad_fn=<MseLossBackward>)
output :  tensor([[111846.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(427654.6875, grad_fn=<MseLossBackward>)
output :  tensor([[112644.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(415934.3125, grad_fn=<MseLossBackward>)
output :  tensor([[147904.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1220265.3750, grad_fn=<MseLossBackward>)
output :  tensor([[159487.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3546e+10, grad_fn=<MseLossBackward>)
output :  tensor([[176749.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(10568391., grad_fn=<MseLossBackward>)
output :  tensor([[126877.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(387671.6250, grad_fn=<MseLossBackward>)
output :  tensor([[143451.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2396497.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178995.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9444e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117499.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(359625.0938, grad_fn=<MseLossBackward>)
output :  tensor([[195494.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2265918.7500, grad_fn=<MseLossBackward>)
output :  tensor([[146309.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1714135.5000, grad_fn=<MseLossBackward>)
output :  tensor([[207273.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(31658206., grad_fn=<MseLossBackward>)
output :  tensor([[123985.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(4059501., grad_fn=<MseLossBackward>)
output :  tensor([[247933.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(155322.2031, grad_fn=<MseLossBackward>)
output :  tensor([[234388.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5615e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151388.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9955e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85561.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0324e+08, grad_fn=<MseLossBackward>)
output :  tensor([[192561.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7796e+09, grad_fn=<MseLossBackward>)
output :  tensor([[87294.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(39615616., grad_fn=<MseLossBackward>)
output :  tensor([[140817.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1736094.5000, grad_fn=<MseLossBackward>)
output :  tensor([[75158.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(116531.5547, grad_fn=<MseLossBackward>)
output :  tensor([[143935.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(964354.6875, grad_fn=<MseLossBackward>)
output :  tensor([[176578.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(334969.6562, grad_fn=<MseLossBackward>)
output :  tensor([[152938.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(315089.2500, grad_fn=<MseLossBackward>)
output :  tensor([[109743.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(5493640., grad_fn=<MseLossBackward>)
output :  tensor([[204619.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2350e+10, grad_fn=<MseLossBackward>)
output :  tensor([[127734.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(585798.8750, grad_fn=<MseLossBackward>)
output :  tensor([[268393.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3471e+08, grad_fn=<MseLossBackward>)
output :  tensor([[300325.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(93587488., grad_fn=<MseLossBackward>)
output :  tensor([[108582.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1171096., grad_fn=<MseLossBackward>)
output :  tensor([[170323.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4735316., grad_fn=<MseLossBackward>)
output :  tensor([[133430.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4672e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134955.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(16360255., grad_fn=<MseLossBackward>)
output :  tensor([[129821.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(183458.2969, grad_fn=<MseLossBackward>)
output :  tensor([[126051.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1105258., grad_fn=<MseLossBackward>)
output :  tensor([[132768.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4143e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227329.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8287e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188326.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3309e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143638.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(68227.0703, grad_fn=<MseLossBackward>)
output :  tensor([[129979.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6147843., grad_fn=<MseLossBackward>)
output :  tensor([[110897.]], grad_fn=<AddmmBackward>)
loss:  tensor(124609., grad_fn=<MseLossBackward>)
output :  tensor([[254095.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0916e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134927.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5190.7520, grad_fn=<MseLossBackward>)
output :  tensor([[199856.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(9882083., grad_fn=<MseLossBackward>)
output :  tensor([[101758.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9871575., grad_fn=<MseLossBackward>)
output :  tensor([[138594.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1836914.3750, grad_fn=<MseLossBackward>)
output :  tensor([[206528.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2299e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179839.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3675.3906, grad_fn=<MseLossBackward>)
output :  tensor([[187097.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4401473., grad_fn=<MseLossBackward>)
output :  tensor([[163791.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1085e+10, grad_fn=<MseLossBackward>)
output :  tensor([[301227.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1406e+09, grad_fn=<MseLossBackward>)
output :  tensor([[198075.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(30822.1914, grad_fn=<MseLossBackward>)
output :  tensor([[256237.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1498e+10, grad_fn=<MseLossBackward>)
output :  tensor([[220455.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0743e+09, grad_fn=<MseLossBackward>)
output :  tensor([[279489.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4071e+09, grad_fn=<MseLossBackward>)
output :  tensor([[224161.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(26137.7949, grad_fn=<MseLossBackward>)
output :  tensor([[222638.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8683e+10, grad_fn=<MseLossBackward>)
output :  tensor([[198915.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3669918.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158861.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9173e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136013.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(12347867., grad_fn=<MseLossBackward>)
output :  tensor([[135986.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(236864.7188, grad_fn=<MseLossBackward>)
output :  tensor([[91714.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(510365.1250, grad_fn=<MseLossBackward>)
output :  tensor([[104879.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(9739861., grad_fn=<MseLossBackward>)
output :  tensor([[275362.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8662e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237677.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(7169173.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144751.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(61713.4297, grad_fn=<MseLossBackward>)
output :  tensor([[139557.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4231570.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174064.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(110099.5312, grad_fn=<MseLossBackward>)
output :  tensor([[146143.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(799096.3125, grad_fn=<MseLossBackward>)
output :  tensor([[163723.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4719e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165993.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(987135.3750, grad_fn=<MseLossBackward>)
output :  tensor([[137321.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(103482.8438, grad_fn=<MseLossBackward>)
output :  tensor([[189633.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5070e+09, grad_fn=<MseLossBackward>)
output :  tensor([[112263.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(69580.5469, grad_fn=<MseLossBackward>)
output :  tensor([[169565.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5927323., grad_fn=<MseLossBackward>)
output :  tensor([[121211.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1467808., grad_fn=<MseLossBackward>)
output :  tensor([[87602.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(362836.8125, grad_fn=<MseLossBackward>)
output :  tensor([[180101.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(10235.7480, grad_fn=<MseLossBackward>)
output :  tensor([[108950.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(901060.7500, grad_fn=<MseLossBackward>)
output :  tensor([[237528.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2164898.5000, grad_fn=<MseLossBackward>)
output :  tensor([[242017.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(8893535., grad_fn=<MseLossBackward>)
output :  tensor([[129395.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(11013.5186, grad_fn=<MseLossBackward>)
output :  tensor([[112534.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(12786379., grad_fn=<MseLossBackward>)
output :  tensor([[287964.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2257e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170644.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(731853.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130059.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(25599726., grad_fn=<MseLossBackward>)
output :  tensor([[143261.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3817e+08, grad_fn=<MseLossBackward>)
output :  tensor([[200245.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8919e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137599.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(11563507., grad_fn=<MseLossBackward>)
output :  tensor([[155772.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5432e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157767.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(14955018., grad_fn=<MseLossBackward>)
output :  tensor([[131276.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3155508.2500, grad_fn=<MseLossBackward>)
output :  tensor([[244338.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7999e+10, grad_fn=<MseLossBackward>)
output :  tensor([[396815.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(26882928., grad_fn=<MseLossBackward>)
output :  tensor([[114175.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(26786770., grad_fn=<MseLossBackward>)
output :  tensor([[109759.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(76391968., grad_fn=<MseLossBackward>)
output :  tensor([[159966.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(217928.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132177.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7621e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161984.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6018e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175598.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3031e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103910.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(96419.9531, grad_fn=<MseLossBackward>)
output :  tensor([[138304.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7265046.5000, grad_fn=<MseLossBackward>)
output :  tensor([[357570.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(94548272., grad_fn=<MseLossBackward>)
output :  tensor([[201048.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8039e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181152.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(31956232., grad_fn=<MseLossBackward>)
output :  tensor([[197972.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(24278254., grad_fn=<MseLossBackward>)
output :  tensor([[134341.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(21701186., grad_fn=<MseLossBackward>)
output :  tensor([[193728.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(594609.6875, grad_fn=<MseLossBackward>)
output :  tensor([[134322.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1946e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180480.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(269377.2188, grad_fn=<MseLossBackward>)
output :  tensor([[240656.]], grad_fn=<AddmmBackward>)
loss:  tensor(1806336., grad_fn=<MseLossBackward>)
output :  tensor([[171109.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(8356255., grad_fn=<MseLossBackward>)
output :  tensor([[105379.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6866283.5000, grad_fn=<MseLossBackward>)
output :  tensor([[266151.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2530286.7500, grad_fn=<MseLossBackward>)
output :  tensor([[246792.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(10290262., grad_fn=<MseLossBackward>)
output :  tensor([[123544.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(296182.5625, grad_fn=<MseLossBackward>)
output :  tensor([[216778.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3898e+09, grad_fn=<MseLossBackward>)
output :  tensor([[296536.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2736e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206248.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(565010.6250, grad_fn=<MseLossBackward>)
output :  tensor([[214056.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5862e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158588.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(474268.9375, grad_fn=<MseLossBackward>)
output :  tensor([[169212.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(604554.8750, grad_fn=<MseLossBackward>)
output :  tensor([[160797.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(14942694., grad_fn=<MseLossBackward>)
output :  tensor([[170952.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(906452.7500, grad_fn=<MseLossBackward>)
output :  tensor([[236784.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7440e+08, grad_fn=<MseLossBackward>)
output :  tensor([[216370.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7122e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162218.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3160e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125126.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4523929.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175775.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1500433.6250, grad_fn=<MseLossBackward>)
output :  tensor([[178681.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6127e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205625.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5718e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136725.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5262006., grad_fn=<MseLossBackward>)
output :  tensor([[153347.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0079e+09, grad_fn=<MseLossBackward>)
output :  tensor([[279217.]], grad_fn=<AddmmBackward>)
loss:  tensor(4915089., grad_fn=<MseLossBackward>)
output :  tensor([[89688.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(21980934., grad_fn=<MseLossBackward>)
output :  tensor([[235586.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(834967.6250, grad_fn=<MseLossBackward>)
output :  tensor([[260275.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0411e+11, grad_fn=<MseLossBackward>)
output :  tensor([[171446.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2092633.5000, grad_fn=<MseLossBackward>)
output :  tensor([[193584.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7153e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152004.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(8970680., grad_fn=<MseLossBackward>)
output :  tensor([[205256.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1917e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130534.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2355074., grad_fn=<MseLossBackward>)
output :  tensor([[144647.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(124322.3516, grad_fn=<MseLossBackward>)
output :  tensor([[170631.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9136e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184109.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3027980.7500, grad_fn=<MseLossBackward>)
output :  tensor([[125620.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(144293.1406, grad_fn=<MseLossBackward>)
output :  tensor([[135893.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(368259.3438, grad_fn=<MseLossBackward>)
output :  tensor([[171040.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3839334., grad_fn=<MseLossBackward>)
output :  tensor([[199265.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5740e+09, grad_fn=<MseLossBackward>)
output :  tensor([[240165.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(8035542., grad_fn=<MseLossBackward>)
output :  tensor([[153177.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3322018.7500, grad_fn=<MseLossBackward>)
output :  tensor([[197377.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1898324.2500, grad_fn=<MseLossBackward>)
output :  tensor([[166073.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8724e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185914.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(41148816., grad_fn=<MseLossBackward>)
output :  tensor([[180037.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(18983.6719, grad_fn=<MseLossBackward>)
output :  tensor([[99615.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6838715.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174492.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1132e+10, grad_fn=<MseLossBackward>)
output :  tensor([[137215.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4908855.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120715.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(32670602., grad_fn=<MseLossBackward>)
output :  tensor([[171092.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8454192., grad_fn=<MseLossBackward>)
output :  tensor([[84406.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(352372.0938, grad_fn=<MseLossBackward>)
output :  tensor([[288297.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2897867.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164254.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(555467.4375, grad_fn=<MseLossBackward>)
output :  tensor([[191147.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0170e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243450.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5898e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152317.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1734777.1250, grad_fn=<MseLossBackward>)
output :  tensor([[124575.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(331461.0625, grad_fn=<MseLossBackward>)
output :  tensor([[122401.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(6256369., grad_fn=<MseLossBackward>)
output :  tensor([[145580.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3519e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174303.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(92235.5859, grad_fn=<MseLossBackward>)
output :  tensor([[112268.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8616e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207390.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2234e+10, grad_fn=<MseLossBackward>)
output :  tensor([[224281.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9648e+08, grad_fn=<MseLossBackward>)
output :  tensor([[250778.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0855e+10, grad_fn=<MseLossBackward>)
output :  tensor([[223669.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3501e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195573.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4382e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189404.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3628429.7500, grad_fn=<MseLossBackward>)
output :  tensor([[205937.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7931e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188875.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1645e+10, grad_fn=<MseLossBackward>)
output :  tensor([[181103.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5584507.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153029.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1059323.3750, grad_fn=<MseLossBackward>)
output :  tensor([[333410.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(12881818., grad_fn=<MseLossBackward>)
output :  tensor([[208303.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(13663304., grad_fn=<MseLossBackward>)
output :  tensor([[160854.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(729476.1250, grad_fn=<MseLossBackward>)
output :  tensor([[185733.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1099e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107182.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4762078.5000, grad_fn=<MseLossBackward>)
output :  tensor([[267904.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2424e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170194.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(13728646., grad_fn=<MseLossBackward>)
output :  tensor([[212650.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(722314.0625, grad_fn=<MseLossBackward>)
output :  tensor([[206770.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0247e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179505.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(93063.1250, grad_fn=<MseLossBackward>)
output :  tensor([[201919.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(14242.9307, grad_fn=<MseLossBackward>)
output :  tensor([[157037.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4152807.2500, grad_fn=<MseLossBackward>)
output :  tensor([[148659.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3677e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117335.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1354968.7500, grad_fn=<MseLossBackward>)
output :  tensor([[139610.]], grad_fn=<AddmmBackward>)
loss:  tensor(152100., grad_fn=<MseLossBackward>)
output :  tensor([[148500.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(249625.1406, grad_fn=<MseLossBackward>)
output :  tensor([[199273.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6570e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159409.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8235.5625, grad_fn=<MseLossBackward>)
output :  tensor([[101600.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4413085., grad_fn=<MseLossBackward>)
output :  tensor([[223907.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5897e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187175.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6984e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177293.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(653217.5625, grad_fn=<MseLossBackward>)
output :  tensor([[84649.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(7020802.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129850.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1825158.7500, grad_fn=<MseLossBackward>)
output :  tensor([[214047.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2266.6526, grad_fn=<MseLossBackward>)
output :  tensor([[143178.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(674528.5625, grad_fn=<MseLossBackward>)
output :  tensor([[128362.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(2680869., grad_fn=<MseLossBackward>)
output :  tensor([[145878.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(10746923., grad_fn=<MseLossBackward>)
output :  tensor([[178473.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6789e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145152.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1327824.1250, grad_fn=<MseLossBackward>)
output :  tensor([[160856.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(733565.5000, grad_fn=<MseLossBackward>)
output :  tensor([[215386.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(149008.0625, grad_fn=<MseLossBackward>)
output :  tensor([[138230.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1043e+09, grad_fn=<MseLossBackward>)
output :  tensor([[258474.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(12071933., grad_fn=<MseLossBackward>)
output :  tensor([[160274.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(600092.3125, grad_fn=<MseLossBackward>)
output :  tensor([[129451.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(905069.8125, grad_fn=<MseLossBackward>)
output :  tensor([[93980.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1038806.8750, grad_fn=<MseLossBackward>)
output :  tensor([[153621.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7778e+09, grad_fn=<MseLossBackward>)
output :  tensor([[177510.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5710457., grad_fn=<MseLossBackward>)
output :  tensor([[116497.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(16018818., grad_fn=<MseLossBackward>)
output :  tensor([[190662.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4660e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145758.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3901e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149128.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(595381., grad_fn=<MseLossBackward>)
output :  tensor([[187619.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(16981.3477, grad_fn=<MseLossBackward>)
output :  tensor([[251943.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6919e+09, grad_fn=<MseLossBackward>)
output :  tensor([[92594.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1197605.3750, grad_fn=<MseLossBackward>)
output :  tensor([[238565.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2056580.1250, grad_fn=<MseLossBackward>)
output :  tensor([[126677.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3322588.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167238.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7341e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114947.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2344e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174962.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1076276.6250, grad_fn=<MseLossBackward>)
output :  tensor([[166133.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1465e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155614.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3074e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235389.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(13034356., grad_fn=<MseLossBackward>)
output :  tensor([[225451.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0594e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124408.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(6714455., grad_fn=<MseLossBackward>)
output :  tensor([[127708.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(2918732., grad_fn=<MseLossBackward>)
output :  tensor([[222731.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(18224094., grad_fn=<MseLossBackward>)
output :  tensor([[226761.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(52389324., grad_fn=<MseLossBackward>)
output :  tensor([[231464.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(22702544., grad_fn=<MseLossBackward>)
output :  tensor([[148117.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(13703.6289, grad_fn=<MseLossBackward>)
output :  tensor([[201954.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(64727808., grad_fn=<MseLossBackward>)
output :  tensor([[128336.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(69491112., grad_fn=<MseLossBackward>)
output :  tensor([[136281.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(14303051., grad_fn=<MseLossBackward>)
output :  tensor([[311203.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(14410091., grad_fn=<MseLossBackward>)
output :  tensor([[142584.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2509749., grad_fn=<MseLossBackward>)
output :  tensor([[121755.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9981e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108223.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(1628953.6250, grad_fn=<MseLossBackward>)
output :  tensor([[156139.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6768e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178463.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2663e+09, grad_fn=<MseLossBackward>)
output :  tensor([[170090.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(8463554., grad_fn=<MseLossBackward>)
output :  tensor([[191442.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(91338040., grad_fn=<MseLossBackward>)
output :  tensor([[101323.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(1751218., grad_fn=<MseLossBackward>)
output :  tensor([[180132.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1281494.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164140.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(14131256., grad_fn=<MseLossBackward>)
output :  tensor([[139590.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(349059.4062, grad_fn=<MseLossBackward>)
output :  tensor([[265033.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8485e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142608.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3188e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173591.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(349909.2188, grad_fn=<MseLossBackward>)
output :  tensor([[143470.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(12042852., grad_fn=<MseLossBackward>)
output :  tensor([[197920.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6653659., grad_fn=<MseLossBackward>)
output :  tensor([[167990.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4039660.2500, grad_fn=<MseLossBackward>)
output :  tensor([[240357.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(13265416., grad_fn=<MseLossBackward>)
output :  tensor([[133556.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(890015.3750, grad_fn=<MseLossBackward>)
output :  tensor([[153707.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(18986444., grad_fn=<MseLossBackward>)
output :  tensor([[212523.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6135219.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162236.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7639350.5000, grad_fn=<MseLossBackward>)
output :  tensor([[185105.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(15166400., grad_fn=<MseLossBackward>)
output :  tensor([[131652.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4786e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128280.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(517140.7500, grad_fn=<MseLossBackward>)
output :  tensor([[137035.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(8788075., grad_fn=<MseLossBackward>)
output :  tensor([[202377.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5054e+09, grad_fn=<MseLossBackward>)
output :  tensor([[169567.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9776e+09, grad_fn=<MseLossBackward>)
output :  tensor([[75222.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3172e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94279.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(95643816., grad_fn=<MseLossBackward>)
output :  tensor([[257325.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(16263955., grad_fn=<MseLossBackward>)
output :  tensor([[200563.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7900e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115871.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(759362.4375, grad_fn=<MseLossBackward>)
output :  tensor([[160126.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4931e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208848.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2435e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177714.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5166e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155729.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(531873.9375, grad_fn=<MseLossBackward>)
output :  tensor([[170733.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(537563.9375, grad_fn=<MseLossBackward>)
output :  tensor([[111045.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(15635599., grad_fn=<MseLossBackward>)
output :  tensor([[165131.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0266e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195003.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4152e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219707.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(43147.0781, grad_fn=<MseLossBackward>)
output :  tensor([[245173.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4983e+11, grad_fn=<MseLossBackward>)
output :  tensor([[149450.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6003419., grad_fn=<MseLossBackward>)
output :  tensor([[111355.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(8266254., grad_fn=<MseLossBackward>)
output :  tensor([[167931.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9513e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153642.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(9878351., grad_fn=<MseLossBackward>)
output :  tensor([[238700.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2890372., grad_fn=<MseLossBackward>)
output :  tensor([[113494.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2265307.2500, grad_fn=<MseLossBackward>)
output :  tensor([[177628.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(27785088., grad_fn=<MseLossBackward>)
output :  tensor([[183603.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9586764., grad_fn=<MseLossBackward>)
output :  tensor([[167043.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3396e+10, grad_fn=<MseLossBackward>)
output :  tensor([[95144.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0006e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237644.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1836363.7500, grad_fn=<MseLossBackward>)
output :  tensor([[177349.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1820138.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139867.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(17457.0156, grad_fn=<MseLossBackward>)
output :  tensor([[232406.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(6728268.5000, grad_fn=<MseLossBackward>)
output :  tensor([[156602.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(40925208., grad_fn=<MseLossBackward>)
output :  tensor([[198447.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6016e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132247.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7578665., grad_fn=<MseLossBackward>)
output :  tensor([[185962.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7420e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138013.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4055377.7500, grad_fn=<MseLossBackward>)
output :  tensor([[225350.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1341e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227025.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2782e+08, grad_fn=<MseLossBackward>)
output :  tensor([[89832.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(28035.3164, grad_fn=<MseLossBackward>)
output :  tensor([[162587.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(9946928., grad_fn=<MseLossBackward>)
output :  tensor([[243765.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6158e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144635.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(132621.1562, grad_fn=<MseLossBackward>)
output :  tensor([[108963.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7609e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163972.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(278239.7812, grad_fn=<MseLossBackward>)
output :  tensor([[141441.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6547761.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131233.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(9200985., grad_fn=<MseLossBackward>)
output :  tensor([[190946.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6313e+09, grad_fn=<MseLossBackward>)
output :  tensor([[126155.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(13362794., grad_fn=<MseLossBackward>)
output :  tensor([[150758.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1540274.8750, grad_fn=<MseLossBackward>)
output :  tensor([[169280.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6096578.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150427.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(328132.0625, grad_fn=<MseLossBackward>)
output :  tensor([[160776.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4511110.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136005.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2932e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130010.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(3957706.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153541.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1145e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147294.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9876681., grad_fn=<MseLossBackward>)
output :  tensor([[162994.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1549519.2500, grad_fn=<MseLossBackward>)
output :  tensor([[141296.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8577e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148809.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(85.8518, grad_fn=<MseLossBackward>)
output :  tensor([[185541.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6042301.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170698.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2883575.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179204.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(632944.5625, grad_fn=<MseLossBackward>)
output :  tensor([[221240.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1538724., grad_fn=<MseLossBackward>)
output :  tensor([[110453.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(6518407.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137822.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6700e+08, grad_fn=<MseLossBackward>)
output :  tensor([[285934.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4290.2500, grad_fn=<MseLossBackward>)
output :  tensor([[114866.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1284432.6250, grad_fn=<MseLossBackward>)
output :  tensor([[176329.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9071e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179902.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(25988488., grad_fn=<MseLossBackward>)
output :  tensor([[190634.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(26366138., grad_fn=<MseLossBackward>)
output :  tensor([[251908.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3324e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223000.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1000687.6250, grad_fn=<MseLossBackward>)
output :  tensor([[126748.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3466e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176038.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3075e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126478.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(6144472.5000, grad_fn=<MseLossBackward>)
output :  tensor([[184412.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4703e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151071.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3720016.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155490.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(80826000., grad_fn=<MseLossBackward>)
output :  tensor([[206059.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(58028.2930, grad_fn=<MseLossBackward>)
output :  tensor([[144265.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3842e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176342.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(117209.9453, grad_fn=<MseLossBackward>)
output :  tensor([[249607.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9354e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148604.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(365344.6875, grad_fn=<MseLossBackward>)
output :  tensor([[203594.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(864115.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161502.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2410450.2500, grad_fn=<MseLossBackward>)
output :  tensor([[125262.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3885e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134057.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2864080.2500, grad_fn=<MseLossBackward>)
output :  tensor([[183271.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(530188.7500, grad_fn=<MseLossBackward>)
output :  tensor([[198228.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(67701784., grad_fn=<MseLossBackward>)
output :  tensor([[227718.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7554e+09, grad_fn=<MseLossBackward>)
output :  tensor([[251793.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(27107154., grad_fn=<MseLossBackward>)
output :  tensor([[183662.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8316e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145053.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8680e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145618.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1250692.7500, grad_fn=<MseLossBackward>)
output :  tensor([[71085.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6633e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135229.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(52892.8125, grad_fn=<MseLossBackward>)
output :  tensor([[129993.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(1196784.7500, grad_fn=<MseLossBackward>)
output :  tensor([[155904.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3627775., grad_fn=<MseLossBackward>)
output :  tensor([[130147.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(9906904., grad_fn=<MseLossBackward>)
output :  tensor([[80648.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(17207330., grad_fn=<MseLossBackward>)
output :  tensor([[83270.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(1613713.7500, grad_fn=<MseLossBackward>)
output :  tensor([[224141.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(61761424., grad_fn=<MseLossBackward>)
output :  tensor([[142551.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0310e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128080.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5853753.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165796.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1447547.3750, grad_fn=<MseLossBackward>)
output :  tensor([[232085.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8495676., grad_fn=<MseLossBackward>)
output :  tensor([[189375.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7644706.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157222.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1495270.3750, grad_fn=<MseLossBackward>)
output :  tensor([[199628.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2988036.2500, grad_fn=<MseLossBackward>)
output :  tensor([[201003.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2958e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135456.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2382585.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156533.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2350951.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135187.]], grad_fn=<AddmmBackward>)
loss:  tensor(660969., grad_fn=<MseLossBackward>)
output :  tensor([[198548.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8922e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157630.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(13178488., grad_fn=<MseLossBackward>)
output :  tensor([[136782.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8734e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142775.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4511442.5000, grad_fn=<MseLossBackward>)
output :  tensor([[206693.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(28158278., grad_fn=<MseLossBackward>)
output :  tensor([[103094.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4500e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164737.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7632701., grad_fn=<MseLossBackward>)
output :  tensor([[128632.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(399611.6562, grad_fn=<MseLossBackward>)
output :  tensor([[147071.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5049.8789, grad_fn=<MseLossBackward>)
output :  tensor([[107663.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0503e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136197.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1695977.1250, grad_fn=<MseLossBackward>)
output :  tensor([[233634.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5596551.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145638.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(408201.1875, grad_fn=<MseLossBackward>)
output :  tensor([[140582.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(9504407., grad_fn=<MseLossBackward>)
output :  tensor([[165613.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4148e+09, grad_fn=<MseLossBackward>)
output :  tensor([[267960.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0079e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179219.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(17807082., grad_fn=<MseLossBackward>)
output :  tensor([[102379.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(156995.4844, grad_fn=<MseLossBackward>)
output :  tensor([[200813.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8808e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156745.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5081854.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162579.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6159e+10, grad_fn=<MseLossBackward>)
output :  tensor([[99443.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1308450., grad_fn=<MseLossBackward>)
output :  tensor([[122175.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2028443.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154974.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1052034.8750, grad_fn=<MseLossBackward>)
output :  tensor([[142273.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5168660., grad_fn=<MseLossBackward>)
output :  tensor([[200431.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(186205.7344, grad_fn=<MseLossBackward>)
output :  tensor([[135889.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(37335156., grad_fn=<MseLossBackward>)
output :  tensor([[260033.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5046130.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128452.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2569e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163045.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6022729.5000, grad_fn=<MseLossBackward>)
output :  tensor([[189584.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1175496.3750, grad_fn=<MseLossBackward>)
output :  tensor([[120430.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0881e+08, grad_fn=<MseLossBackward>)
output :  tensor([[251257.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1580834.7500, grad_fn=<MseLossBackward>)
output :  tensor([[160507.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0186e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244150.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1439362.6250, grad_fn=<MseLossBackward>)
output :  tensor([[147171.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(10059403., grad_fn=<MseLossBackward>)
output :  tensor([[209623.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(141599.3438, grad_fn=<MseLossBackward>)
output :  tensor([[177507.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(26085758., grad_fn=<MseLossBackward>)
output :  tensor([[153466.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(284272.2500, grad_fn=<MseLossBackward>)
output :  tensor([[115449.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6505050., grad_fn=<MseLossBackward>)
output :  tensor([[242477.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9903e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239294.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(498369.8125, grad_fn=<MseLossBackward>)
output :  tensor([[154383.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1095391.1250, grad_fn=<MseLossBackward>)
output :  tensor([[252615.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5220011., grad_fn=<MseLossBackward>)
output :  tensor([[125878.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2939e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175844.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(24107.4141, grad_fn=<MseLossBackward>)
output :  tensor([[162389.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5709038., grad_fn=<MseLossBackward>)
output :  tensor([[131647.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(418952.7812, grad_fn=<MseLossBackward>)
output :  tensor([[194071.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1695e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162585.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1999837.8750, grad_fn=<MseLossBackward>)
output :  tensor([[164688.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2850926.7500, grad_fn=<MseLossBackward>)
output :  tensor([[157562.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(191419.9219, grad_fn=<MseLossBackward>)
output :  tensor([[151865.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3863190.2500, grad_fn=<MseLossBackward>)
output :  tensor([[172465.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9646e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164745.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(22516804., grad_fn=<MseLossBackward>)
output :  tensor([[379417.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(20728956., grad_fn=<MseLossBackward>)
output :  tensor([[137328.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0668e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128892.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8829e+09, grad_fn=<MseLossBackward>)
output :  tensor([[281811.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(357641.3750, grad_fn=<MseLossBackward>)
output :  tensor([[162846.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(716456.4375, grad_fn=<MseLossBackward>)
output :  tensor([[130562.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0126e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235432.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(11779697., grad_fn=<MseLossBackward>)
output :  tensor([[180672.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(29804.7852, grad_fn=<MseLossBackward>)
output :  tensor([[151667.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(110691.3672, grad_fn=<MseLossBackward>)
output :  tensor([[143281.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2954101.5000, grad_fn=<MseLossBackward>)
output :  tensor([[156423.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8115e+08, grad_fn=<MseLossBackward>)
output :  tensor([[102514.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(6323142.5000, grad_fn=<MseLossBackward>)
output :  tensor([[79029.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6212e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167035.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4144850.7500, grad_fn=<MseLossBackward>)
output :  tensor([[186846.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6936e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157653.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(120322.2656, grad_fn=<MseLossBackward>)
output :  tensor([[153394.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(16858852., grad_fn=<MseLossBackward>)
output :  tensor([[141223.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(14242368., grad_fn=<MseLossBackward>)
output :  tensor([[209820.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(14982343., grad_fn=<MseLossBackward>)
output :  tensor([[141401.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(11568502., grad_fn=<MseLossBackward>)
output :  tensor([[183111.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6101e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144266.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3005130.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110579.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6064e+08, grad_fn=<MseLossBackward>)
output :  tensor([[97472.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(12056412., grad_fn=<MseLossBackward>)
output :  tensor([[174717.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(79629.7812, grad_fn=<MseLossBackward>)
output :  tensor([[264245.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(14786188., grad_fn=<MseLossBackward>)
output :  tensor([[137511.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(15904767., grad_fn=<MseLossBackward>)
output :  tensor([[160564.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(448544.1250, grad_fn=<MseLossBackward>)
output :  tensor([[135180.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(7186169., grad_fn=<MseLossBackward>)
output :  tensor([[145898.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(12972378., grad_fn=<MseLossBackward>)
output :  tensor([[167158.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(549451.5625, grad_fn=<MseLossBackward>)
output :  tensor([[126555.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(197656.6562, grad_fn=<MseLossBackward>)
output :  tensor([[174716.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8307e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158460.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2131873.7500, grad_fn=<MseLossBackward>)
output :  tensor([[121141.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(21543160., grad_fn=<MseLossBackward>)
output :  tensor([[161512.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1104e+09, grad_fn=<MseLossBackward>)
output :  tensor([[53525.4336]], grad_fn=<AddmmBackward>)
loss:  tensor(2326947.7500, grad_fn=<MseLossBackward>)
output :  tensor([[231886.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4985e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200773.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(51451., grad_fn=<MseLossBackward>)
output :  tensor([[185445.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(198428.4844, grad_fn=<MseLossBackward>)
output :  tensor([[106088.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(7841.9326, grad_fn=<MseLossBackward>)
output :  tensor([[88825.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(3332478.7500, grad_fn=<MseLossBackward>)
output :  tensor([[137996.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4012447.2500, grad_fn=<MseLossBackward>)
output :  tensor([[221352.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2777e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201810.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(32371832., grad_fn=<MseLossBackward>)
output :  tensor([[166675.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2807405., grad_fn=<MseLossBackward>)
output :  tensor([[171068.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8232e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189047.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(907613.5000, grad_fn=<MseLossBackward>)
output :  tensor([[90907.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(15266908., grad_fn=<MseLossBackward>)
output :  tensor([[140140.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(19836.9609, grad_fn=<MseLossBackward>)
output :  tensor([[110185.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(98949.5625, grad_fn=<MseLossBackward>)
output :  tensor([[150936.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2429e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172916.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7570e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193341.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3593e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179847.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(23361.2109, grad_fn=<MseLossBackward>)
output :  tensor([[94962.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(2365083.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117854.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(125349.1875, grad_fn=<MseLossBackward>)
output :  tensor([[160376.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5807e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197673.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5411003., grad_fn=<MseLossBackward>)
output :  tensor([[143259.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(548039.4375, grad_fn=<MseLossBackward>)
train_loss: [2.6259256e+09]
epoch_result tensor([0.])
output :  tensor([[157252.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1557075., grad_fn=<MseLossBackward>)
output :  tensor([[124486.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6184003.5000, grad_fn=<MseLossBackward>)
output :  tensor([[196187.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3947299.7500, grad_fn=<MseLossBackward>)
output :  tensor([[176969.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(914.1174, grad_fn=<MseLossBackward>)
output :  tensor([[154492.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5260e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131288.]], grad_fn=<AddmmBackward>)
loss:  tensor(10810944., grad_fn=<MseLossBackward>)
output :  tensor([[138248.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(7571010., grad_fn=<MseLossBackward>)
output :  tensor([[119448.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(200718., grad_fn=<MseLossBackward>)
output :  tensor([[68182.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(93753984., grad_fn=<MseLossBackward>)
output :  tensor([[166806.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(649661.1875, grad_fn=<MseLossBackward>)
output :  tensor([[132546.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(55552800., grad_fn=<MseLossBackward>)
output :  tensor([[224377.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(387661.8750, grad_fn=<MseLossBackward>)
output :  tensor([[169958.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(918063.3750, grad_fn=<MseLossBackward>)
output :  tensor([[250457.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(573498.5625, grad_fn=<MseLossBackward>)
output :  tensor([[56039.9961]], grad_fn=<AddmmBackward>)
loss:  tensor(1081591.8750, grad_fn=<MseLossBackward>)
output :  tensor([[162319.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1755e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178179.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(10111307., grad_fn=<MseLossBackward>)
output :  tensor([[171411.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2235e+08, grad_fn=<MseLossBackward>)
output :  tensor([[274766.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(54653.6719, grad_fn=<MseLossBackward>)
output :  tensor([[194172.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7992194., grad_fn=<MseLossBackward>)
output :  tensor([[136167.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6359e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196584.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7317278.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179004.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1064e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150556.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(196525.9688, grad_fn=<MseLossBackward>)
output :  tensor([[176163.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(37988924., grad_fn=<MseLossBackward>)
output :  tensor([[84490.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(827716.1250, grad_fn=<MseLossBackward>)
output :  tensor([[168668.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0989e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185846.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(715821.7500, grad_fn=<MseLossBackward>)
output :  tensor([[206260.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4245e+09, grad_fn=<MseLossBackward>)
output :  tensor([[112563.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6570651., grad_fn=<MseLossBackward>)
output :  tensor([[171129.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(16802.6406, grad_fn=<MseLossBackward>)
output :  tensor([[132938.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(12686842., grad_fn=<MseLossBackward>)
output :  tensor([[127860.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1297570.1250, grad_fn=<MseLossBackward>)
output :  tensor([[122035.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(6430781., grad_fn=<MseLossBackward>)
output :  tensor([[146278.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5724e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169483.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1175e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150426.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(528347.2500, grad_fn=<MseLossBackward>)
output :  tensor([[178626.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1885472.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142585.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2512918.5000, grad_fn=<MseLossBackward>)
output :  tensor([[105911.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5318e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135623.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3007e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133253.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3051626.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135297.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(68842280., grad_fn=<MseLossBackward>)
output :  tensor([[226147.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1315931.6250, grad_fn=<MseLossBackward>)
output :  tensor([[133758.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2275902.2500, grad_fn=<MseLossBackward>)
output :  tensor([[154404.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(29210816., grad_fn=<MseLossBackward>)
output :  tensor([[113264.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1598367.6250, grad_fn=<MseLossBackward>)
output :  tensor([[163111.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(9683669., grad_fn=<MseLossBackward>)
output :  tensor([[145926.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4082e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194813.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7918420., grad_fn=<MseLossBackward>)
output :  tensor([[134947.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(247832.8438, grad_fn=<MseLossBackward>)
output :  tensor([[119585.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(91887952., grad_fn=<MseLossBackward>)
output :  tensor([[231505.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6220659.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164987.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3525e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163089.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(16724394., grad_fn=<MseLossBackward>)
output :  tensor([[203321.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8621e+10, grad_fn=<MseLossBackward>)
output :  tensor([[248462.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1138e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143495.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(23.4619, grad_fn=<MseLossBackward>)
output :  tensor([[132613.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1921949., grad_fn=<MseLossBackward>)
output :  tensor([[156955.]], grad_fn=<AddmmBackward>)
loss:  tensor(3822025., grad_fn=<MseLossBackward>)
output :  tensor([[135196.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(27007510., grad_fn=<MseLossBackward>)
output :  tensor([[181937.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0937e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179529.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(20890184., grad_fn=<MseLossBackward>)
output :  tensor([[164111.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6819687.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153842.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1757e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141997.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(252867.5469, grad_fn=<MseLossBackward>)
output :  tensor([[141008.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(15932197., grad_fn=<MseLossBackward>)
output :  tensor([[171107.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7030e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194128.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2310e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139460.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(8762248., grad_fn=<MseLossBackward>)
output :  tensor([[174444.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6475196., grad_fn=<MseLossBackward>)
output :  tensor([[177027.]], grad_fn=<AddmmBackward>)
loss:  tensor(15784729., grad_fn=<MseLossBackward>)
output :  tensor([[117750.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(7565551., grad_fn=<MseLossBackward>)
output :  tensor([[221367.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(135033.2812, grad_fn=<MseLossBackward>)
output :  tensor([[178557.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(24424754., grad_fn=<MseLossBackward>)
output :  tensor([[123187.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5346861.5000, grad_fn=<MseLossBackward>)
output :  tensor([[197118.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(382986.9375, grad_fn=<MseLossBackward>)
output :  tensor([[176141.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1542331.1250, grad_fn=<MseLossBackward>)
output :  tensor([[207297.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2024e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209425.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2480379., grad_fn=<MseLossBackward>)
output :  tensor([[167840.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3573e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193474.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1052259.2500, grad_fn=<MseLossBackward>)
output :  tensor([[112750.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(62289.2422, grad_fn=<MseLossBackward>)
output :  tensor([[115521.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9126630., grad_fn=<MseLossBackward>)
output :  tensor([[112712.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(507968.0312, grad_fn=<MseLossBackward>)
output :  tensor([[146871.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5047.6582, grad_fn=<MseLossBackward>)
output :  tensor([[160279.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3256e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180068.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4722.2666, grad_fn=<MseLossBackward>)
output :  tensor([[128763.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1596195.3750, grad_fn=<MseLossBackward>)
output :  tensor([[144215.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(615685.4375, grad_fn=<MseLossBackward>)
output :  tensor([[187413.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7577e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119978.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(9479519., grad_fn=<MseLossBackward>)
output :  tensor([[198471.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2166094., grad_fn=<MseLossBackward>)
output :  tensor([[147450.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6005333., grad_fn=<MseLossBackward>)
output :  tensor([[213226.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(106857.4844, grad_fn=<MseLossBackward>)
output :  tensor([[125245.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(569836.2500, grad_fn=<MseLossBackward>)
output :  tensor([[246803.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2323766.7500, grad_fn=<MseLossBackward>)
output :  tensor([[235962.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4047e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149263.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1909e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85535.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0200e+08, grad_fn=<MseLossBackward>)
output :  tensor([[192694.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7578e+09, grad_fn=<MseLossBackward>)
output :  tensor([[81969.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(939839.3750, grad_fn=<MseLossBackward>)
output :  tensor([[140240.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(547808.1250, grad_fn=<MseLossBackward>)
output :  tensor([[79400.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(15216582., grad_fn=<MseLossBackward>)
output :  tensor([[142308.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(415420.5312, grad_fn=<MseLossBackward>)
output :  tensor([[176886.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(785716.0625, grad_fn=<MseLossBackward>)
output :  tensor([[153157.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(117563.2656, grad_fn=<MseLossBackward>)
output :  tensor([[108341.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(885804.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202746.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2770e+10, grad_fn=<MseLossBackward>)
output :  tensor([[127502.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(995738.9375, grad_fn=<MseLossBackward>)
output :  tensor([[267860.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4738e+08, grad_fn=<MseLossBackward>)
output :  tensor([[306723.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(10732790., grad_fn=<MseLossBackward>)
output :  tensor([[108344.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(713444.1875, grad_fn=<MseLossBackward>)
output :  tensor([[169353.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(9899381., grad_fn=<MseLossBackward>)
output :  tensor([[135514.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5707e+08, grad_fn=<MseLossBackward>)
output :  tensor([[142733.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(13941472., grad_fn=<MseLossBackward>)
output :  tensor([[132420.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4712020., grad_fn=<MseLossBackward>)
output :  tensor([[128956.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(15650987., grad_fn=<MseLossBackward>)
output :  tensor([[135196.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6031e+08, grad_fn=<MseLossBackward>)
output :  tensor([[228038.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8010e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187327.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3615e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143690.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(44047.5156, grad_fn=<MseLossBackward>)
output :  tensor([[124535.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(8790993., grad_fn=<MseLossBackward>)
output :  tensor([[114687.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(11814473., grad_fn=<MseLossBackward>)
output :  tensor([[253903.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1162e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136070.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1145167.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200614.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5689492., grad_fn=<MseLossBackward>)
output :  tensor([[104320.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(336291.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140455.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(255656.6406, grad_fn=<MseLossBackward>)
output :  tensor([[208687.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5005e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185046.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(26484694., grad_fn=<MseLossBackward>)
output :  tensor([[187728.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7446332.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163059.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1299e+10, grad_fn=<MseLossBackward>)
output :  tensor([[297539.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4033e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197600.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(89606.6797, grad_fn=<MseLossBackward>)
output :  tensor([[261269.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0048e+10, grad_fn=<MseLossBackward>)
output :  tensor([[219157.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1942e+09, grad_fn=<MseLossBackward>)
output :  tensor([[280907.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3027e+09, grad_fn=<MseLossBackward>)
output :  tensor([[221737.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5117139., grad_fn=<MseLossBackward>)
output :  tensor([[222876.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8603e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193165.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(14702432., grad_fn=<MseLossBackward>)
output :  tensor([[159436.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2641e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134102.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2569258.2500, grad_fn=<MseLossBackward>)
output :  tensor([[133527.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3891989.2500, grad_fn=<MseLossBackward>)
output :  tensor([[90911.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(7840.5488, grad_fn=<MseLossBackward>)
output :  tensor([[107525.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(224838.9688, grad_fn=<MseLossBackward>)
output :  tensor([[273454.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0742e+09, grad_fn=<MseLossBackward>)
output :  tensor([[232493.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6283169., grad_fn=<MseLossBackward>)
output :  tensor([[146426.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2035348., grad_fn=<MseLossBackward>)
output :  tensor([[135842.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2747047.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170138.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(12918858., grad_fn=<MseLossBackward>)
output :  tensor([[146069.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(671682.6875, grad_fn=<MseLossBackward>)
output :  tensor([[165552.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3795e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168123.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(9754203., grad_fn=<MseLossBackward>)
output :  tensor([[135537.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2140277.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191523.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7643e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113432.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2052459.1250, grad_fn=<MseLossBackward>)
output :  tensor([[174215.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4906779., grad_fn=<MseLossBackward>)
output :  tensor([[123703.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(13713713., grad_fn=<MseLossBackward>)
output :  tensor([[87804.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(646466.2500, grad_fn=<MseLossBackward>)
output :  tensor([[178784.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1477326.2500, grad_fn=<MseLossBackward>)
output :  tensor([[108719.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(1393488., grad_fn=<MseLossBackward>)
output :  tensor([[240350.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1824019.1250, grad_fn=<MseLossBackward>)
output :  tensor([[247426.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(5888433., grad_fn=<MseLossBackward>)
output :  tensor([[136759.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(52695348., grad_fn=<MseLossBackward>)
output :  tensor([[110456.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2241055.7500, grad_fn=<MseLossBackward>)
output :  tensor([[288453.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2112e+10, grad_fn=<MseLossBackward>)
output :  tensor([[175824.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(18697516., grad_fn=<MseLossBackward>)
output :  tensor([[126111.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(1235658., grad_fn=<MseLossBackward>)
output :  tensor([[143871.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6936e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199136.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2093e+08, grad_fn=<MseLossBackward>)
output :  tensor([[142428.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2039630.2500, grad_fn=<MseLossBackward>)
output :  tensor([[157826.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4926e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152991.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(826053.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128596.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(816269.8750, grad_fn=<MseLossBackward>)
output :  tensor([[247329.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7206e+10, grad_fn=<MseLossBackward>)
output :  tensor([[397884.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(16937598., grad_fn=<MseLossBackward>)
output :  tensor([[108712.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(82885.5078, grad_fn=<MseLossBackward>)
output :  tensor([[119434.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(873115.0625, grad_fn=<MseLossBackward>)
output :  tensor([[159467.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1070.5166, grad_fn=<MseLossBackward>)
output :  tensor([[133688.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1255e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163088.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4705e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174009.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0972e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103998.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(158671.5156, grad_fn=<MseLossBackward>)
output :  tensor([[141460.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(212002.6875, grad_fn=<MseLossBackward>)
output :  tensor([[363585.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(13754595., grad_fn=<MseLossBackward>)
output :  tensor([[204744.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4261e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174350.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1321458., grad_fn=<MseLossBackward>)
output :  tensor([[203264.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(133202.1875, grad_fn=<MseLossBackward>)
output :  tensor([[139787.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(619861., grad_fn=<MseLossBackward>)
output :  tensor([[193578.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(848586.4375, grad_fn=<MseLossBackward>)
output :  tensor([[136231.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2550e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182186.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1407040.7500, grad_fn=<MseLossBackward>)
output :  tensor([[237325.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(21853142., grad_fn=<MseLossBackward>)
output :  tensor([[172335.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2772173., grad_fn=<MseLossBackward>)
output :  tensor([[107841.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(25144.5449, grad_fn=<MseLossBackward>)
output :  tensor([[263622.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(879961.2500, grad_fn=<MseLossBackward>)
output :  tensor([[255396.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(29117660., grad_fn=<MseLossBackward>)
output :  tensor([[121829.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1368973.1250, grad_fn=<MseLossBackward>)
output :  tensor([[216312.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4443e+09, grad_fn=<MseLossBackward>)
output :  tensor([[305462.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9351e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209373.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5635208.5000, grad_fn=<MseLossBackward>)
output :  tensor([[216042.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5365e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159946.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4186947.2500, grad_fn=<MseLossBackward>)
output :  tensor([[172845.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8152185., grad_fn=<MseLossBackward>)
output :  tensor([[158343.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1992067.6250, grad_fn=<MseLossBackward>)
output :  tensor([[169086.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(835110.3750, grad_fn=<MseLossBackward>)
output :  tensor([[237837.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0979e+08, grad_fn=<MseLossBackward>)
output :  tensor([[216849.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5893e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162861.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5160e+08, grad_fn=<MseLossBackward>)
output :  tensor([[121554.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2089334.7500, grad_fn=<MseLossBackward>)
output :  tensor([[177750.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(563133., grad_fn=<MseLossBackward>)
output :  tensor([[178748.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6019e+09, grad_fn=<MseLossBackward>)
output :  tensor([[206098.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5539e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133599.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(693602.6875, grad_fn=<MseLossBackward>)
output :  tensor([[151404.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8832e+08, grad_fn=<MseLossBackward>)
output :  tensor([[279778.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(7719367.5000, grad_fn=<MseLossBackward>)
output :  tensor([[88857.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(14877594., grad_fn=<MseLossBackward>)
output :  tensor([[236891.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(153272.2500, grad_fn=<MseLossBackward>)
output :  tensor([[259093.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0487e+11, grad_fn=<MseLossBackward>)
output :  tensor([[166121.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(15044823., grad_fn=<MseLossBackward>)
output :  tensor([[195238.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5810e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154967.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1062.3525, grad_fn=<MseLossBackward>)
output :  tensor([[205677.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1374e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128525.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(225498.8438, grad_fn=<MseLossBackward>)
output :  tensor([[151011.]], grad_fn=<AddmmBackward>)
loss:  tensor(36132120., grad_fn=<MseLossBackward>)
output :  tensor([[169613.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3512e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184282.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2456860.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128476.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(6132549., grad_fn=<MseLossBackward>)
output :  tensor([[139644.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(9889649., grad_fn=<MseLossBackward>)
output :  tensor([[176734.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(13949291., grad_fn=<MseLossBackward>)
output :  tensor([[197061.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8024e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237980.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(25200244., grad_fn=<MseLossBackward>)
output :  tensor([[154175.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(679259.2500, grad_fn=<MseLossBackward>)
output :  tensor([[201949.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(35393948., grad_fn=<MseLossBackward>)
output :  tensor([[165632.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6797e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188810.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(86683080., grad_fn=<MseLossBackward>)
output :  tensor([[177357.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6463591., grad_fn=<MseLossBackward>)
output :  tensor([[96685.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(98846.3750, grad_fn=<MseLossBackward>)
output :  tensor([[173948.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1247e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135489.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(239182.1250, grad_fn=<MseLossBackward>)
output :  tensor([[123074.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(65197552., grad_fn=<MseLossBackward>)
output :  tensor([[169980.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(16154622., grad_fn=<MseLossBackward>)
output :  tensor([[86957.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3831928.5000, grad_fn=<MseLossBackward>)
output :  tensor([[289506.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(243326.3906, grad_fn=<MseLossBackward>)
output :  tensor([[171888.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(47445620., grad_fn=<MseLossBackward>)
output :  tensor([[193290.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9566e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243026.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8251e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151444.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(197441.3750, grad_fn=<MseLossBackward>)
output :  tensor([[121602.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(5746470.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120071.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(29404.2109, grad_fn=<MseLossBackward>)
output :  tensor([[143352.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0388e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174681.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(464484.8438, grad_fn=<MseLossBackward>)
output :  tensor([[113575.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6572e+08, grad_fn=<MseLossBackward>)
output :  tensor([[212102.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1214e+10, grad_fn=<MseLossBackward>)
output :  tensor([[235284.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(38630692., grad_fn=<MseLossBackward>)
output :  tensor([[250532.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0926e+10, grad_fn=<MseLossBackward>)
output :  tensor([[220020.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6021e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194494.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4642e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187658.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(25166.8477, grad_fn=<MseLossBackward>)
output :  tensor([[207366.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7308e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186408.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2378e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179636.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(803320.0625, grad_fn=<MseLossBackward>)
output :  tensor([[153623.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2634687., grad_fn=<MseLossBackward>)
output :  tensor([[334067.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8596991., grad_fn=<MseLossBackward>)
output :  tensor([[211077.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(850487.4375, grad_fn=<MseLossBackward>)
output :  tensor([[162690.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7239967.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186286.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0486e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105714.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(510086.0938, grad_fn=<MseLossBackward>)
output :  tensor([[271858.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0169e+10, grad_fn=<MseLossBackward>)
output :  tensor([[172437.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2139454.7500, grad_fn=<MseLossBackward>)
output :  tensor([[210679.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(7955925.5000, grad_fn=<MseLossBackward>)
output :  tensor([[210216.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1628e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178154.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1093070.2500, grad_fn=<MseLossBackward>)
output :  tensor([[201385.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(172147.2031, grad_fn=<MseLossBackward>)
output :  tensor([[155308.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(95191.5312, grad_fn=<MseLossBackward>)
output :  tensor([[147578.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2637e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118556.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3188.7197, grad_fn=<MseLossBackward>)
output :  tensor([[142238.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5013051., grad_fn=<MseLossBackward>)
output :  tensor([[149919.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(845566.4375, grad_fn=<MseLossBackward>)
output :  tensor([[199254.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6575e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161258.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3092981.7500, grad_fn=<MseLossBackward>)
output :  tensor([[99135.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(133110.9688, grad_fn=<MseLossBackward>)
output :  tensor([[225441.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1195e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187372.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7840e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174881.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2570310.2500, grad_fn=<MseLossBackward>)
output :  tensor([[79120.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(8289810.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128631.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(17265.5488, grad_fn=<MseLossBackward>)
output :  tensor([[213975.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(599.4846, grad_fn=<MseLossBackward>)
output :  tensor([[142906.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1196220.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135137.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(26396154., grad_fn=<MseLossBackward>)
output :  tensor([[143068.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(219301.9688, grad_fn=<MseLossBackward>)
output :  tensor([[177791.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6234e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144606.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(368126.5938, grad_fn=<MseLossBackward>)
output :  tensor([[159952.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2301.0010, grad_fn=<MseLossBackward>)
output :  tensor([[213534.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2146957.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137055.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0276e+09, grad_fn=<MseLossBackward>)
output :  tensor([[255994.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(989900.6250, grad_fn=<MseLossBackward>)
output :  tensor([[157406.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4381041.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130291.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3208520.5000, grad_fn=<MseLossBackward>)
output :  tensor([[93304.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2873819.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152777.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6618e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178623.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1628814., grad_fn=<MseLossBackward>)
output :  tensor([[121074.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(329996.4062, grad_fn=<MseLossBackward>)
output :  tensor([[188800.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6119e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145044.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2960e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149204.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(484068.0625, grad_fn=<MseLossBackward>)
output :  tensor([[187647.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(10535.0977, grad_fn=<MseLossBackward>)
output :  tensor([[250676.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7978e+09, grad_fn=<MseLossBackward>)
output :  tensor([[92308.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(653230.1875, grad_fn=<MseLossBackward>)
output :  tensor([[239147.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(726516.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130141.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2693496.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166237.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9326e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114014.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9641e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177773.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3146798.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164777.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4404e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154743.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8775e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239831.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(691574.1250, grad_fn=<MseLossBackward>)
output :  tensor([[224720.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1075e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128293.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1672374.3750, grad_fn=<MseLossBackward>)
output :  tensor([[125106.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(797630.3750, grad_fn=<MseLossBackward>)
output :  tensor([[224614.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5688374., grad_fn=<MseLossBackward>)
output :  tensor([[231056.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8665296., grad_fn=<MseLossBackward>)
output :  tensor([[228610.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3649890.7500, grad_fn=<MseLossBackward>)
output :  tensor([[149222.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1494964.7500, grad_fn=<MseLossBackward>)
output :  tensor([[210277.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(77006.2500, grad_fn=<MseLossBackward>)
output :  tensor([[131100.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2322e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135995.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(12219722., grad_fn=<MseLossBackward>)
output :  tensor([[311685.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(10983632., grad_fn=<MseLossBackward>)
output :  tensor([[139702.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1683060.2500, grad_fn=<MseLossBackward>)
output :  tensor([[121216.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9394e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108688.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(658316.6875, grad_fn=<MseLossBackward>)
output :  tensor([[155271.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9683e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177956.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3640e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175899.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(8408913., grad_fn=<MseLossBackward>)
output :  tensor([[190015.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2066e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91213.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(77210136., grad_fn=<MseLossBackward>)
output :  tensor([[179477.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(227543.9062, grad_fn=<MseLossBackward>)
output :  tensor([[169533.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2669854., grad_fn=<MseLossBackward>)
output :  tensor([[139960.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(923340.8125, grad_fn=<MseLossBackward>)
output :  tensor([[257030.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0418e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141806.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2270e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173578.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(335132.4375, grad_fn=<MseLossBackward>)
output :  tensor([[139748.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(63291.5547, grad_fn=<MseLossBackward>)
output :  tensor([[195860.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(21526410., grad_fn=<MseLossBackward>)
output :  tensor([[168459.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2372851.5000, grad_fn=<MseLossBackward>)
output :  tensor([[245931.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3728881.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135402.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(814534.4375, grad_fn=<MseLossBackward>)
output :  tensor([[152393.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(9264604., grad_fn=<MseLossBackward>)
output :  tensor([[215411.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(169280.8125, grad_fn=<MseLossBackward>)
output :  tensor([[167133.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4553556., grad_fn=<MseLossBackward>)
output :  tensor([[195642.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(44128412., grad_fn=<MseLossBackward>)
output :  tensor([[132116.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2273e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130840.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(3385628.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138140.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3456520., grad_fn=<MseLossBackward>)
output :  tensor([[198896.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9849e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166970.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7009e+09, grad_fn=<MseLossBackward>)
output :  tensor([[78113.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2809e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92482.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(63719308., grad_fn=<MseLossBackward>)
output :  tensor([[249862.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(11765222., grad_fn=<MseLossBackward>)
output :  tensor([[205117.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3715e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114372.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(393256.3750, grad_fn=<MseLossBackward>)
output :  tensor([[155945.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9566e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207830.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4811e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178947.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2906e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158456.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(11945124., grad_fn=<MseLossBackward>)
output :  tensor([[165368.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(21453688., grad_fn=<MseLossBackward>)
output :  tensor([[115452.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(205025.0156, grad_fn=<MseLossBackward>)
output :  tensor([[161972.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(48612272., grad_fn=<MseLossBackward>)
output :  tensor([[194047.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6520e+08, grad_fn=<MseLossBackward>)
output :  tensor([[214193.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(28162756., grad_fn=<MseLossBackward>)
output :  tensor([[247463.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4754e+11, grad_fn=<MseLossBackward>)
output :  tensor([[146173.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(683567.2500, grad_fn=<MseLossBackward>)
output :  tensor([[113446.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(24666122., grad_fn=<MseLossBackward>)
output :  tensor([[171749.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0304e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153066.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6587644., grad_fn=<MseLossBackward>)
output :  tensor([[234636.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5585393.5000, grad_fn=<MseLossBackward>)
output :  tensor([[116065.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(1134574.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177432.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(29892360., grad_fn=<MseLossBackward>)
output :  tensor([[184883.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3298083., grad_fn=<MseLossBackward>)
output :  tensor([[165825.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3770e+10, grad_fn=<MseLossBackward>)
output :  tensor([[96423.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3790e+08, grad_fn=<MseLossBackward>)
output :  tensor([[246719.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(59592612., grad_fn=<MseLossBackward>)
output :  tensor([[178891.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(8362670., grad_fn=<MseLossBackward>)
output :  tensor([[141947.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3791478.2500, grad_fn=<MseLossBackward>)
output :  tensor([[234759.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(57682.5312, grad_fn=<MseLossBackward>)
output :  tensor([[167784.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(22888450., grad_fn=<MseLossBackward>)
output :  tensor([[202141.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5094e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132563.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5934781., grad_fn=<MseLossBackward>)
output :  tensor([[188185.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8570e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136802.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(644733.7500, grad_fn=<MseLossBackward>)
output :  tensor([[224938.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2235e+08, grad_fn=<MseLossBackward>)
output :  tensor([[228586.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5855e+08, grad_fn=<MseLossBackward>)
output :  tensor([[88005.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(3976067.2500, grad_fn=<MseLossBackward>)
output :  tensor([[161440.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4025791.5000, grad_fn=<MseLossBackward>)
output :  tensor([[244040.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6088e+10, grad_fn=<MseLossBackward>)
output :  tensor([[148452.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(11919648., grad_fn=<MseLossBackward>)
output :  tensor([[109729.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8258e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163405.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1198717., grad_fn=<MseLossBackward>)
output :  tensor([[143117.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(778227.1875, grad_fn=<MseLossBackward>)
output :  tensor([[128968.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(590808.4375, grad_fn=<MseLossBackward>)
output :  tensor([[189957.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7669e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124122.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(2632633., grad_fn=<MseLossBackward>)
output :  tensor([[150322.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2813167.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166594.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(26580792., grad_fn=<MseLossBackward>)
output :  tensor([[152530.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2341856.2500, grad_fn=<MseLossBackward>)
output :  tensor([[161673.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1504187.2500, grad_fn=<MseLossBackward>)
output :  tensor([[136179.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3873e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132269.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(72647.0938, grad_fn=<MseLossBackward>)
output :  tensor([[154897.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5272e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146266.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4469194., grad_fn=<MseLossBackward>)
output :  tensor([[163393.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2701862.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135734.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6745e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150069.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1611273.2500, grad_fn=<MseLossBackward>)
output :  tensor([[185382.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(6849507., grad_fn=<MseLossBackward>)
output :  tensor([[170373.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1886588.1250, grad_fn=<MseLossBackward>)
output :  tensor([[179181.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(670607.4375, grad_fn=<MseLossBackward>)
output :  tensor([[219162.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(702165.4375, grad_fn=<MseLossBackward>)
output :  tensor([[109773.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3508655.7500, grad_fn=<MseLossBackward>)
output :  tensor([[136797.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4156e+08, grad_fn=<MseLossBackward>)
output :  tensor([[284347.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2730859.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120475.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(20028072., grad_fn=<MseLossBackward>)
output :  tensor([[178601.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7139e+09, grad_fn=<MseLossBackward>)
output :  tensor([[187024.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4099233., grad_fn=<MseLossBackward>)
output :  tensor([[180516.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(24832470., grad_fn=<MseLossBackward>)
output :  tensor([[249886.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3067e+08, grad_fn=<MseLossBackward>)
output :  tensor([[217709.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(18405440., grad_fn=<MseLossBackward>)
output :  tensor([[126651.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3062e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175486.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0562e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126779.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(7725273., grad_fn=<MseLossBackward>)
output :  tensor([[181283.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6305e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150489.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(6303944., grad_fn=<MseLossBackward>)
output :  tensor([[155893.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(88242248., grad_fn=<MseLossBackward>)
output :  tensor([[201338.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(24618342., grad_fn=<MseLossBackward>)
output :  tensor([[144986.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5592e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174335.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2769624., grad_fn=<MseLossBackward>)
output :  tensor([[252060.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5291e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147114.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(784276.3125, grad_fn=<MseLossBackward>)
output :  tensor([[198888.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(14265611., grad_fn=<MseLossBackward>)
output :  tensor([[160309.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(129094.2422, grad_fn=<MseLossBackward>)
output :  tensor([[125065.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3739e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136978.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1509365.8750, grad_fn=<MseLossBackward>)
output :  tensor([[184574.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(329583.6250, grad_fn=<MseLossBackward>)
output :  tensor([[198109.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(65766016., grad_fn=<MseLossBackward>)
output :  tensor([[229613.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5268e+09, grad_fn=<MseLossBackward>)
output :  tensor([[252698.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(18506532., grad_fn=<MseLossBackward>)
output :  tensor([[184796.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8011e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144065.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7631e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143620.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(773630.1875, grad_fn=<MseLossBackward>)
output :  tensor([[71423.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8743e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126672.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(69353632., grad_fn=<MseLossBackward>)
output :  tensor([[128197.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(494000.3125, grad_fn=<MseLossBackward>)
output :  tensor([[154524.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(275100.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129602.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(6772152.5000, grad_fn=<MseLossBackward>)
output :  tensor([[79538.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(9230204., grad_fn=<MseLossBackward>)
output :  tensor([[82317.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(100662.4375, grad_fn=<MseLossBackward>)
output :  tensor([[234032.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4130230.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142190.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8150e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130844.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(118691.0156, grad_fn=<MseLossBackward>)
output :  tensor([[173129.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(37576132., grad_fn=<MseLossBackward>)
output :  tensor([[235925.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(856752.6875, grad_fn=<MseLossBackward>)
output :  tensor([[189320.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7947818., grad_fn=<MseLossBackward>)
output :  tensor([[159272.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(10709359., grad_fn=<MseLossBackward>)
output :  tensor([[196241.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2751296., grad_fn=<MseLossBackward>)
output :  tensor([[199894.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3768e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135985.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1029178.5625, grad_fn=<MseLossBackward>)
output :  tensor([[154688.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(96934.9297, grad_fn=<MseLossBackward>)
output :  tensor([[136728.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(530598.4375, grad_fn=<MseLossBackward>)
output :  tensor([[198482.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9338e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153861.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(19281.9258, grad_fn=<MseLossBackward>)
output :  tensor([[137489.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9350e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146794.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3587354.5000, grad_fn=<MseLossBackward>)
output :  tensor([[204743.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(52663824., grad_fn=<MseLossBackward>)
output :  tensor([[103139.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4687e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164735.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7640128., grad_fn=<MseLossBackward>)
output :  tensor([[127414.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(343276.9688, grad_fn=<MseLossBackward>)
output :  tensor([[146034.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(931918.7500, grad_fn=<MseLossBackward>)
output :  tensor([[107304.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0179e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138026.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(276856.8438, grad_fn=<MseLossBackward>)
output :  tensor([[235834.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(27441.9922, grad_fn=<MseLossBackward>)
output :  tensor([[143508.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2224572.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139476.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3906428.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164004.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2963e+09, grad_fn=<MseLossBackward>)
output :  tensor([[270245.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(60132756., grad_fn=<MseLossBackward>)
output :  tensor([[177244.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5039393.5000, grad_fn=<MseLossBackward>)
output :  tensor([[102380.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(156278.1562, grad_fn=<MseLossBackward>)
output :  tensor([[203320.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5026e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159917.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(840975., grad_fn=<MseLossBackward>)
output :  tensor([[163622.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5712e+10, grad_fn=<MseLossBackward>)
output :  tensor([[100966.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(7108431., grad_fn=<MseLossBackward>)
output :  tensor([[123996.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(156834.5625, grad_fn=<MseLossBackward>)
output :  tensor([[156481.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(232007.7969, grad_fn=<MseLossBackward>)
output :  tensor([[142239.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5015010.5000, grad_fn=<MseLossBackward>)
output :  tensor([[201278.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1634402.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140704.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1679575.5000, grad_fn=<MseLossBackward>)
output :  tensor([[265184.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8433398., grad_fn=<MseLossBackward>)
output :  tensor([[129690.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3462e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166476.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(953979.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186279.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4932008., grad_fn=<MseLossBackward>)
output :  tensor([[126815.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8275e+08, grad_fn=<MseLossBackward>)
output :  tensor([[246406.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(12911333., grad_fn=<MseLossBackward>)
output :  tensor([[158135.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3318e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244344.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1010653.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143901.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(9779.3555, grad_fn=<MseLossBackward>)
output :  tensor([[210229.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(52534.0742, grad_fn=<MseLossBackward>)
output :  tensor([[178991.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(43441900., grad_fn=<MseLossBackward>)
output :  tensor([[155996.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3986074.7500, grad_fn=<MseLossBackward>)
output :  tensor([[118475.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(226204.2812, grad_fn=<MseLossBackward>)
output :  tensor([[234771.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7373e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238022.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3910753.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152305.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1064733.7500, grad_fn=<MseLossBackward>)
output :  tensor([[255924.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1048992., grad_fn=<MseLossBackward>)
output :  tensor([[123829.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(86961304., grad_fn=<MseLossBackward>)
output :  tensor([[175329.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(449549.3125, grad_fn=<MseLossBackward>)
output :  tensor([[159974.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(671.9436, grad_fn=<MseLossBackward>)
output :  tensor([[132048.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1099286.7500, grad_fn=<MseLossBackward>)
output :  tensor([[194955.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2844e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163318.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(464208., grad_fn=<MseLossBackward>)
output :  tensor([[166149.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(9920827., grad_fn=<MseLossBackward>)
output :  tensor([[158229.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(52584.2227, grad_fn=<MseLossBackward>)
output :  tensor([[146817.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(9501036., grad_fn=<MseLossBackward>)
output :  tensor([[174167.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1819e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160448.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(200914.0625, grad_fn=<MseLossBackward>)
output :  tensor([[378078.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(34708668., grad_fn=<MseLossBackward>)
output :  tensor([[126701.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(89195.5547, grad_fn=<MseLossBackward>)
output :  tensor([[129162.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9064e+09, grad_fn=<MseLossBackward>)
output :  tensor([[277776.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(11807599., grad_fn=<MseLossBackward>)
output :  tensor([[163175.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1382645.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132772.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5062e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226913.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(25874230., grad_fn=<MseLossBackward>)
output :  tensor([[181097.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(357230.3438, grad_fn=<MseLossBackward>)
output :  tensor([[154421.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5865100., grad_fn=<MseLossBackward>)
output :  tensor([[146364.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1860794.3750, grad_fn=<MseLossBackward>)
output :  tensor([[154391.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0597e+08, grad_fn=<MseLossBackward>)
output :  tensor([[98438.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(2438599.5000, grad_fn=<MseLossBackward>)
output :  tensor([[75704.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4664e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162836.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4679650.5000, grad_fn=<MseLossBackward>)
output :  tensor([[187849.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6121e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158558.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(311695.4062, grad_fn=<MseLossBackward>)
output :  tensor([[156539.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(922560.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138622.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1375086., grad_fn=<MseLossBackward>)
output :  tensor([[205565.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(147876.2969, grad_fn=<MseLossBackward>)
output :  tensor([[138420.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(176478.7656, grad_fn=<MseLossBackward>)
output :  tensor([[181687.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6464e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147395.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1947245.8750, grad_fn=<MseLossBackward>)
output :  tensor([[109511.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0288e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91844.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4644833., grad_fn=<MseLossBackward>)
output :  tensor([[177894.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8375959.5000, grad_fn=<MseLossBackward>)
output :  tensor([[254262.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(37666796., grad_fn=<MseLossBackward>)
output :  tensor([[140561.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(880137.1250, grad_fn=<MseLossBackward>)
output :  tensor([[159143.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(564634.8125, grad_fn=<MseLossBackward>)
output :  tensor([[130954.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(2387242.2500, grad_fn=<MseLossBackward>)
output :  tensor([[150375.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(765761.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169394.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2233950.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130757.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(14116164., grad_fn=<MseLossBackward>)
output :  tensor([[173100.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8965e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157566.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(321117., grad_fn=<MseLossBackward>)
output :  tensor([[116367.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(17469.4043, grad_fn=<MseLossBackward>)
output :  tensor([[159010.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4744e+09, grad_fn=<MseLossBackward>)
output :  tensor([[53328.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(1765099.1250, grad_fn=<MseLossBackward>)
output :  tensor([[234400.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0996e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197664.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(11126498., grad_fn=<MseLossBackward>)
output :  tensor([[181744.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(10599705., grad_fn=<MseLossBackward>)
output :  tensor([[106777.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(604263.3125, grad_fn=<MseLossBackward>)
output :  tensor([[86652.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(120604.2656, grad_fn=<MseLossBackward>)
output :  tensor([[140048.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2399.4690, grad_fn=<MseLossBackward>)
output :  tensor([[220408.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4157e+09, grad_fn=<MseLossBackward>)
output :  tensor([[203537.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(15702521., grad_fn=<MseLossBackward>)
output :  tensor([[165409.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(167549.5156, grad_fn=<MseLossBackward>)
output :  tensor([[173037.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4570e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191211.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1467618.6250, grad_fn=<MseLossBackward>)
output :  tensor([[90570.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(12750702., grad_fn=<MseLossBackward>)
output :  tensor([[139326.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(454086.4688, grad_fn=<MseLossBackward>)
output :  tensor([[114191.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(13624404., grad_fn=<MseLossBackward>)
output :  tensor([[145388.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(88890128., grad_fn=<MseLossBackward>)
output :  tensor([[172156.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6939e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194787.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0430e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180027.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(758.8303, grad_fn=<MseLossBackward>)
output :  tensor([[100846.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(18891384., grad_fn=<MseLossBackward>)
output :  tensor([[118514.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(1028243.5625, grad_fn=<MseLossBackward>)
output :  tensor([[160922.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3258e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199831.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(28518.7656, grad_fn=<MseLossBackward>)
output :  tensor([[144052.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2730.0625, grad_fn=<MseLossBackward>)
train_loss: [2.6158817e+09]
epoch_result tensor([0.])
output :  tensor([[157897.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(362441.6250, grad_fn=<MseLossBackward>)
output :  tensor([[123406.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(1979539.1250, grad_fn=<MseLossBackward>)
output :  tensor([[194844.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(414192.8125, grad_fn=<MseLossBackward>)
output :  tensor([[177998.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(996971.0625, grad_fn=<MseLossBackward>)
output :  tensor([[153860.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8271e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127454.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(297706.6250, grad_fn=<MseLossBackward>)
output :  tensor([[141814.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(664148.6250, grad_fn=<MseLossBackward>)
output :  tensor([[117674.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1757157.3750, grad_fn=<MseLossBackward>)
output :  tensor([[67123.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(74371352., grad_fn=<MseLossBackward>)
output :  tensor([[165097.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(813801.3125, grad_fn=<MseLossBackward>)
output :  tensor([[143250.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(10567376., grad_fn=<MseLossBackward>)
output :  tensor([[225379.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(144032.1094, grad_fn=<MseLossBackward>)
output :  tensor([[166321.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(7176873.5000, grad_fn=<MseLossBackward>)
output :  tensor([[247660.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4160452.5000, grad_fn=<MseLossBackward>)
output :  tensor([[55205.3242]], grad_fn=<AddmmBackward>)
loss:  tensor(42158.0352, grad_fn=<MseLossBackward>)
output :  tensor([[161949.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0447e+08, grad_fn=<MseLossBackward>)
output :  tensor([[170618.]], grad_fn=<AddmmBackward>)
loss:  tensor(19201924., grad_fn=<MseLossBackward>)
output :  tensor([[161241.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(22479304., grad_fn=<MseLossBackward>)
output :  tensor([[273672.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1761426.6250, grad_fn=<MseLossBackward>)
output :  tensor([[197895.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(802396.0625, grad_fn=<MseLossBackward>)
output :  tensor([[136870.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5971e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194961.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1172178.3750, grad_fn=<MseLossBackward>)
output :  tensor([[178389.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1633e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152163.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1354277.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169830.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(28629.6973, grad_fn=<MseLossBackward>)
output :  tensor([[86756.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(1839859.1250, grad_fn=<MseLossBackward>)
output :  tensor([[169436.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1851e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182799.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4843988.5000, grad_fn=<MseLossBackward>)
output :  tensor([[205838.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4663e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110554.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(307444.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170690.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(95751.5625, grad_fn=<MseLossBackward>)
output :  tensor([[138497.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3990193.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130746.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3048679.7500, grad_fn=<MseLossBackward>)
output :  tensor([[121503.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(4014231.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147155.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0934e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167491.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1759e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151317.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2617570., grad_fn=<MseLossBackward>)
output :  tensor([[182263.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5121876., grad_fn=<MseLossBackward>)
output :  tensor([[140622.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(142801.3281, grad_fn=<MseLossBackward>)
output :  tensor([[106985.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8852e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136302.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1933e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136734.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3009628.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139199.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4884e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223631.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1872492.8750, grad_fn=<MseLossBackward>)
output :  tensor([[132589.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(115302.6875, grad_fn=<MseLossBackward>)
output :  tensor([[146608.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5721365., grad_fn=<MseLossBackward>)
output :  tensor([[108938.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(9372113., grad_fn=<MseLossBackward>)
output :  tensor([[158816.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1399526., grad_fn=<MseLossBackward>)
output :  tensor([[147535.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2529e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189372.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6903428., grad_fn=<MseLossBackward>)
output :  tensor([[135143.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(481592.6250, grad_fn=<MseLossBackward>)
output :  tensor([[109167.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(693511.6250, grad_fn=<MseLossBackward>)
output :  tensor([[235475.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2177653.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165617.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2918e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153207.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(33548532., grad_fn=<MseLossBackward>)
output :  tensor([[203005.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8728e+10, grad_fn=<MseLossBackward>)
output :  tensor([[241476.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2662e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145235.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3013424.7500, grad_fn=<MseLossBackward>)
output :  tensor([[141622.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(58096076., grad_fn=<MseLossBackward>)
output :  tensor([[154300.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(489693.8125, grad_fn=<MseLossBackward>)
output :  tensor([[132918.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(8517825., grad_fn=<MseLossBackward>)
output :  tensor([[181051.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2329e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181353.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7544464., grad_fn=<MseLossBackward>)
output :  tensor([[162494.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(988719.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139001.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(15986128., grad_fn=<MseLossBackward>)
output :  tensor([[145362.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(8191133.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147609.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6807696.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172903.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4599e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193977.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3004e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136473.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(677.6260, grad_fn=<MseLossBackward>)
output :  tensor([[170391.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2275195.2500, grad_fn=<MseLossBackward>)
output :  tensor([[179877.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1260918.5000, grad_fn=<MseLossBackward>)
output :  tensor([[115828.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(685946.3125, grad_fn=<MseLossBackward>)
output :  tensor([[216299.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(22094554., grad_fn=<MseLossBackward>)
output :  tensor([[180638.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(8190239., grad_fn=<MseLossBackward>)
output :  tensor([[127663.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4679583., grad_fn=<MseLossBackward>)
output :  tensor([[192575.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(15405012., grad_fn=<MseLossBackward>)
output :  tensor([[170453.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(19770250., grad_fn=<MseLossBackward>)
output :  tensor([[211826.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0423e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209036.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3857234.7500, grad_fn=<MseLossBackward>)
output :  tensor([[167312.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3186e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193899.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(360675.3125, grad_fn=<MseLossBackward>)
output :  tensor([[113831.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(692016., grad_fn=<MseLossBackward>)
output :  tensor([[116056.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(12651804., grad_fn=<MseLossBackward>)
output :  tensor([[114136.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4564098., grad_fn=<MseLossBackward>)
output :  tensor([[144556.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5034274., grad_fn=<MseLossBackward>)
output :  tensor([[158591.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3875e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179978.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(469.6702, grad_fn=<MseLossBackward>)
output :  tensor([[125814.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2840489., grad_fn=<MseLossBackward>)
output :  tensor([[146691.]], grad_fn=<AddmmBackward>)
loss:  tensor(2859481., grad_fn=<MseLossBackward>)
output :  tensor([[183010.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3146e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117710.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(656188.6250, grad_fn=<MseLossBackward>)
output :  tensor([[193437.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(12689959., grad_fn=<MseLossBackward>)
output :  tensor([[141284.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(13802618., grad_fn=<MseLossBackward>)
output :  tensor([[212534.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(133327.6719, grad_fn=<MseLossBackward>)
output :  tensor([[128827.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(7993828.5000, grad_fn=<MseLossBackward>)
output :  tensor([[252405.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(16622948., grad_fn=<MseLossBackward>)
output :  tensor([[237165.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2881e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150406.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6125e+08, grad_fn=<MseLossBackward>)
output :  tensor([[84738.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6354e+08, grad_fn=<MseLossBackward>)
output :  tensor([[191775.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9097e+09, grad_fn=<MseLossBackward>)
output :  tensor([[79182.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3303135.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138758.]], grad_fn=<AddmmBackward>)
loss:  tensor(550564., grad_fn=<MseLossBackward>)
output :  tensor([[78349.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8120006.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143407.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(206527.6406, grad_fn=<MseLossBackward>)
output :  tensor([[171727.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(18257994., grad_fn=<MseLossBackward>)
output :  tensor([[151746.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3073995.2500, grad_fn=<MseLossBackward>)
output :  tensor([[109054.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(2736362.2500, grad_fn=<MseLossBackward>)
output :  tensor([[204653.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2343e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132430.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(15449076., grad_fn=<MseLossBackward>)
output :  tensor([[267408.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5855e+08, grad_fn=<MseLossBackward>)
output :  tensor([[304973.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(25269472., grad_fn=<MseLossBackward>)
output :  tensor([[106549.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(903732.4375, grad_fn=<MseLossBackward>)
output :  tensor([[170077.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5869414.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133294.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3981e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136873.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4521470.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131826.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2486682.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126517.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(2304252.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135253.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6323e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227156.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8355e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191293.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2412e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147752.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(14839349., grad_fn=<MseLossBackward>)
output :  tensor([[126120.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1901813.3750, grad_fn=<MseLossBackward>)
output :  tensor([[112933.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(2833251.7500, grad_fn=<MseLossBackward>)
output :  tensor([[256577.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7803e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135230.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(53267.1992, grad_fn=<MseLossBackward>)
output :  tensor([[209561.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(43057588., grad_fn=<MseLossBackward>)
output :  tensor([[112368.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(55777560., grad_fn=<MseLossBackward>)
output :  tensor([[139491.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(210279.5625, grad_fn=<MseLossBackward>)
output :  tensor([[205567.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5843e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181432.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2349274.7500, grad_fn=<MseLossBackward>)
output :  tensor([[186278.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1634682.1250, grad_fn=<MseLossBackward>)
output :  tensor([[164089.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0999e+10, grad_fn=<MseLossBackward>)
output :  tensor([[300690.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1772e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196931.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(937054.2500, grad_fn=<MseLossBackward>)
output :  tensor([[262810.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9614e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221141.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0122e+09, grad_fn=<MseLossBackward>)
output :  tensor([[280981.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2974e+09, grad_fn=<MseLossBackward>)
output :  tensor([[225583.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2507521.7500, grad_fn=<MseLossBackward>)
output :  tensor([[220360.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9460e+10, grad_fn=<MseLossBackward>)
output :  tensor([[199202.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4849010.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159572.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3469e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130969.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(2341736.7500, grad_fn=<MseLossBackward>)
output :  tensor([[133862.]], grad_fn=<AddmmBackward>)
loss:  tensor(2683044., grad_fn=<MseLossBackward>)
output :  tensor([[90834.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(27317.8906, grad_fn=<MseLossBackward>)
output :  tensor([[108621.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(386155.4375, grad_fn=<MseLossBackward>)
output :  tensor([[273913.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0235e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236009.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1019879.0625, grad_fn=<MseLossBackward>)
output :  tensor([[144686.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(98037.4844, grad_fn=<MseLossBackward>)
output :  tensor([[140655.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(9958857., grad_fn=<MseLossBackward>)
output :  tensor([[176626.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(8370262.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139582.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(32117900., grad_fn=<MseLossBackward>)
output :  tensor([[165262.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5484e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166253.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1571458.1250, grad_fn=<MseLossBackward>)
output :  tensor([[134857.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4592248., grad_fn=<MseLossBackward>)
output :  tensor([[188192.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3155e+09, grad_fn=<MseLossBackward>)
output :  tensor([[112518.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(268566.8750, grad_fn=<MseLossBackward>)
output :  tensor([[164446.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(57052292., grad_fn=<MseLossBackward>)
output :  tensor([[120758.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(575523.7500, grad_fn=<MseLossBackward>)
output :  tensor([[87334.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(111916.3828, grad_fn=<MseLossBackward>)
output :  tensor([[179669.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(109457.5859, grad_fn=<MseLossBackward>)
output :  tensor([[113491.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(12898592., grad_fn=<MseLossBackward>)
output :  tensor([[239576.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(332478.3750, grad_fn=<MseLossBackward>)
output :  tensor([[247992.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(8952532., grad_fn=<MseLossBackward>)
output :  tensor([[127826.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(2799216.5000, grad_fn=<MseLossBackward>)
output :  tensor([[111591.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(6927629.5000, grad_fn=<MseLossBackward>)
output :  tensor([[288212.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2184e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174056.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6535532.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125407.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(165833.4688, grad_fn=<MseLossBackward>)
output :  tensor([[144827.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1969e+08, grad_fn=<MseLossBackward>)
output :  tensor([[201307.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6109e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141093.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(8724.7275, grad_fn=<MseLossBackward>)
output :  tensor([[157750.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4945e+10, grad_fn=<MseLossBackward>)
output :  tensor([[155821.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3691742., grad_fn=<MseLossBackward>)
output :  tensor([[130743.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1545320.8750, grad_fn=<MseLossBackward>)
output :  tensor([[247812.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7079e+10, grad_fn=<MseLossBackward>)
output :  tensor([[398209.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(14371444., grad_fn=<MseLossBackward>)
output :  tensor([[122427.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8029e+08, grad_fn=<MseLossBackward>)
output :  tensor([[110715.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(60600752., grad_fn=<MseLossBackward>)
output :  tensor([[158338.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1349989.8750, grad_fn=<MseLossBackward>)
output :  tensor([[130936.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3193e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163083.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4712e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173088.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9801e+09, grad_fn=<MseLossBackward>)
output :  tensor([[104850.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1564727.3750, grad_fn=<MseLossBackward>)
output :  tensor([[138378.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6870869.5000, grad_fn=<MseLossBackward>)
output :  tensor([[364040.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(10585262., grad_fn=<MseLossBackward>)
output :  tensor([[203077.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5931e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179589.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(16725927., grad_fn=<MseLossBackward>)
output :  tensor([[200414.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6177788., grad_fn=<MseLossBackward>)
output :  tensor([[139854.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(730250.3750, grad_fn=<MseLossBackward>)
output :  tensor([[195558.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1120455.3750, grad_fn=<MseLossBackward>)
output :  tensor([[136759.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5610e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176442.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(20773086., grad_fn=<MseLossBackward>)
output :  tensor([[241027.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(946485.7500, grad_fn=<MseLossBackward>)
output :  tensor([[179997.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(35970192., grad_fn=<MseLossBackward>)
output :  tensor([[109954.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3821841.7500, grad_fn=<MseLossBackward>)
output :  tensor([[264153.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(166260.0625, grad_fn=<MseLossBackward>)
output :  tensor([[255066.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(25672114., grad_fn=<MseLossBackward>)
output :  tensor([[123361.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(130953.5156, grad_fn=<MseLossBackward>)
output :  tensor([[214996.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6004e+09, grad_fn=<MseLossBackward>)
output :  tensor([[304289.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4144e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203669.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(11089733., grad_fn=<MseLossBackward>)
output :  tensor([[211588.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6489e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160420.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6351975., grad_fn=<MseLossBackward>)
output :  tensor([[167671.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5374717.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162527.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(31305248., grad_fn=<MseLossBackward>)
output :  tensor([[168004.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3983454.7500, grad_fn=<MseLossBackward>)
output :  tensor([[236122.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0162e+09, grad_fn=<MseLossBackward>)
output :  tensor([[220383.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(82313088., grad_fn=<MseLossBackward>)
output :  tensor([[160201.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7429e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122346.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(427481., grad_fn=<MseLossBackward>)
output :  tensor([[177937.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(878876.9375, grad_fn=<MseLossBackward>)
output :  tensor([[181463.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1680e+09, grad_fn=<MseLossBackward>)
output :  tensor([[206251.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5482e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134207.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(50561.7383, grad_fn=<MseLossBackward>)
output :  tensor([[149120.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5736e+08, grad_fn=<MseLossBackward>)
output :  tensor([[275114.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3554403.2500, grad_fn=<MseLossBackward>)
output :  tensor([[87878.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(8287066.5000, grad_fn=<MseLossBackward>)
output :  tensor([[236267.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(53925.5469, grad_fn=<MseLossBackward>)
output :  tensor([[256448.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0659e+11, grad_fn=<MseLossBackward>)
output :  tensor([[168681.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1737535.8750, grad_fn=<MseLossBackward>)
output :  tensor([[191867.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8604e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155320.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(102910.6328, grad_fn=<MseLossBackward>)
output :  tensor([[207699.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8814e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130011.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(1022705.5625, grad_fn=<MseLossBackward>)
output :  tensor([[146144.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1309629.8750, grad_fn=<MseLossBackward>)
output :  tensor([[169064.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0566e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188077.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4963427., grad_fn=<MseLossBackward>)
output :  tensor([[125273.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(527620.6250, grad_fn=<MseLossBackward>)
output :  tensor([[138882.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5678019., grad_fn=<MseLossBackward>)
output :  tensor([[174323.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1750866.5000, grad_fn=<MseLossBackward>)
output :  tensor([[196829.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8271e+09, grad_fn=<MseLossBackward>)
output :  tensor([[240862.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4567036., grad_fn=<MseLossBackward>)
output :  tensor([[154895.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(11002.0430, grad_fn=<MseLossBackward>)
output :  tensor([[199265.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(10662980., grad_fn=<MseLossBackward>)
output :  tensor([[161706.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1351e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187298.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(60815384., grad_fn=<MseLossBackward>)
output :  tensor([[174681.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(27231926., grad_fn=<MseLossBackward>)
output :  tensor([[100707.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(13748916., grad_fn=<MseLossBackward>)
output :  tensor([[170908.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1901e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133645.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1833823.7500, grad_fn=<MseLossBackward>)
output :  tensor([[121220.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(38693744., grad_fn=<MseLossBackward>)
output :  tensor([[174156.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(24565.6641, grad_fn=<MseLossBackward>)
output :  tensor([[87760.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7618807.5000, grad_fn=<MseLossBackward>)
output :  tensor([[290615.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(378878.7188, grad_fn=<MseLossBackward>)
output :  tensor([[170488.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(30124832., grad_fn=<MseLossBackward>)
output :  tensor([[193090.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9622e+10, grad_fn=<MseLossBackward>)
output :  tensor([[244356.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0988e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148024.]], grad_fn=<AddmmBackward>)
loss:  tensor(8856576., grad_fn=<MseLossBackward>)
output :  tensor([[125013.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1027087.2500, grad_fn=<MseLossBackward>)
output :  tensor([[113178.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(45177196., grad_fn=<MseLossBackward>)
output :  tensor([[146471.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9043e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171523.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6131582., grad_fn=<MseLossBackward>)
output :  tensor([[112737.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1433e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209410.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1792e+10, grad_fn=<MseLossBackward>)
output :  tensor([[240909.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(348173.7500, grad_fn=<MseLossBackward>)
output :  tensor([[251881.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0538e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222127.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8467e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196305.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4207e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187975.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(225921.9688, grad_fn=<MseLossBackward>)
output :  tensor([[205537.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8107e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191017.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1020e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174107.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(21461648., grad_fn=<MseLossBackward>)
output :  tensor([[150265.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3007081.2500, grad_fn=<MseLossBackward>)
output :  tensor([[338324.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1754465.8750, grad_fn=<MseLossBackward>)
output :  tensor([[211660.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(115408.8281, grad_fn=<MseLossBackward>)
output :  tensor([[159112.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(787573.0625, grad_fn=<MseLossBackward>)
output :  tensor([[185012.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1908e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108970.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(15761334., grad_fn=<MseLossBackward>)
output :  tensor([[273144.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9443e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170863.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(9222894., grad_fn=<MseLossBackward>)
output :  tensor([[223112.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(92395352., grad_fn=<MseLossBackward>)
output :  tensor([[209330.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3618e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178280.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(845710.1250, grad_fn=<MseLossBackward>)
output :  tensor([[205272.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(12057822., grad_fn=<MseLossBackward>)
output :  tensor([[152392.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6796856.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150104.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5104e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119499.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(998094.6875, grad_fn=<MseLossBackward>)
output :  tensor([[139258.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(549358.9375, grad_fn=<MseLossBackward>)
output :  tensor([[146535.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6072297., grad_fn=<MseLossBackward>)
output :  tensor([[201455.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6014e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161855.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5550000., grad_fn=<MseLossBackward>)
output :  tensor([[102117.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(6851020., grad_fn=<MseLossBackward>)
output :  tensor([[224749.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3257e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187485.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8338e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175750.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(539191.8750, grad_fn=<MseLossBackward>)
output :  tensor([[84220.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4928816.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130545.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(4183910.5000, grad_fn=<MseLossBackward>)
output :  tensor([[215715.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2942565., grad_fn=<MseLossBackward>)
output :  tensor([[144064.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4108.0088, grad_fn=<MseLossBackward>)
output :  tensor([[129590.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(167453.5938, grad_fn=<MseLossBackward>)
output :  tensor([[145470.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8242102.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178471.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6786e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143327.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(452109.1562, grad_fn=<MseLossBackward>)
output :  tensor([[161295.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1677389.2500, grad_fn=<MseLossBackward>)
output :  tensor([[215543.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(295307.3438, grad_fn=<MseLossBackward>)
output :  tensor([[138129.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0976e+09, grad_fn=<MseLossBackward>)
output :  tensor([[257227.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4960503.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159976.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(227439.5781, grad_fn=<MseLossBackward>)
output :  tensor([[129988.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2214795., grad_fn=<MseLossBackward>)
output :  tensor([[95822.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(675722.5625, grad_fn=<MseLossBackward>)
output :  tensor([[153437.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7523e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180944.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1090001.2500, grad_fn=<MseLossBackward>)
output :  tensor([[119737.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(581465.8125, grad_fn=<MseLossBackward>)
output :  tensor([[187526.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7159e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144043.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1659e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151495.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2545520.5000, grad_fn=<MseLossBackward>)
output :  tensor([[187488.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(68611.2500, grad_fn=<MseLossBackward>)
output :  tensor([[251952.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6912e+09, grad_fn=<MseLossBackward>)
output :  tensor([[90543.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(915071.6250, grad_fn=<MseLossBackward>)
output :  tensor([[236692.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(10938936., grad_fn=<MseLossBackward>)
output :  tensor([[126245.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(5083792., grad_fn=<MseLossBackward>)
output :  tensor([[165480.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0084e+10, grad_fn=<MseLossBackward>)
output :  tensor([[113620.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8553e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174850.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1320775.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163918.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0115e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153788.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4236e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235029.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(15761520., grad_fn=<MseLossBackward>)
output :  tensor([[226799.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7347e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127488.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(238388.0625, grad_fn=<MseLossBackward>)
output :  tensor([[128661.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7081004., grad_fn=<MseLossBackward>)
output :  tensor([[225046.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3814636.2500, grad_fn=<MseLossBackward>)
output :  tensor([[230361.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(13241184., grad_fn=<MseLossBackward>)
output :  tensor([[227687.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(974909.3750, grad_fn=<MseLossBackward>)
output :  tensor([[146674.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1757571.6250, grad_fn=<MseLossBackward>)
output :  tensor([[210662.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(438906.2500, grad_fn=<MseLossBackward>)
output :  tensor([[127554.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(57068344., grad_fn=<MseLossBackward>)
output :  tensor([[133021.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(271669., grad_fn=<MseLossBackward>)
output :  tensor([[309946.]], grad_fn=<AddmmBackward>)
loss:  tensor(25542916., grad_fn=<MseLossBackward>)
output :  tensor([[140284.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(511560.2188, grad_fn=<MseLossBackward>)
output :  tensor([[121420.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9616e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109212.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(82768.5938, grad_fn=<MseLossBackward>)
output :  tensor([[154384.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2816e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176742.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6005e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172699.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(90516.3672, grad_fn=<MseLossBackward>)
output :  tensor([[191474.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(90729792., grad_fn=<MseLossBackward>)
output :  tensor([[97711.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(5238627., grad_fn=<MseLossBackward>)
output :  tensor([[178240.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(576270.7500, grad_fn=<MseLossBackward>)
output :  tensor([[170037.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4568706., grad_fn=<MseLossBackward>)
output :  tensor([[139284.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(80851.3672, grad_fn=<MseLossBackward>)
output :  tensor([[257536.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0315e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141648.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2091e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171892.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1226556.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143395.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(11527192., grad_fn=<MseLossBackward>)
output :  tensor([[202253.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3073063.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169178.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(674733.8750, grad_fn=<MseLossBackward>)
output :  tensor([[241947.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4211922.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133450.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1102237.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151319.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3879299.5000, grad_fn=<MseLossBackward>)
output :  tensor([[209486.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(30398510., grad_fn=<MseLossBackward>)
output :  tensor([[162226.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7694469., grad_fn=<MseLossBackward>)
output :  tensor([[192952.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(15624480., grad_fn=<MseLossBackward>)
output :  tensor([[133905.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2976e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129700.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(490306.3125, grad_fn=<MseLossBackward>)
output :  tensor([[139692.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(94344.9609, grad_fn=<MseLossBackward>)
output :  tensor([[199928.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8402e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167490.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7553e+09, grad_fn=<MseLossBackward>)
output :  tensor([[76286.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6526e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94180.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(93711624., grad_fn=<MseLossBackward>)
output :  tensor([[259115.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(33899688., grad_fn=<MseLossBackward>)
output :  tensor([[204000.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2251e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115340.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(116020.0703, grad_fn=<MseLossBackward>)
output :  tensor([[158389.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4743e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207257.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6237e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180860.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9458e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158585.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(12858612., grad_fn=<MseLossBackward>)
output :  tensor([[168411.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2523679.7500, grad_fn=<MseLossBackward>)
output :  tensor([[114433.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(320913.4062, grad_fn=<MseLossBackward>)
output :  tensor([[162949.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(63195296., grad_fn=<MseLossBackward>)
output :  tensor([[195239.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3596e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219027.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(223167.6719, grad_fn=<MseLossBackward>)
output :  tensor([[246734.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4827e+11, grad_fn=<MseLossBackward>)
output :  tensor([[144903.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4397081.5000, grad_fn=<MseLossBackward>)
output :  tensor([[108305.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(30393.0195, grad_fn=<MseLossBackward>)
output :  tensor([[169094.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6397e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146838.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(13407955., grad_fn=<MseLossBackward>)
output :  tensor([[231334.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(32098952., grad_fn=<MseLossBackward>)
output :  tensor([[118170.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(10050881., grad_fn=<MseLossBackward>)
output :  tensor([[183068.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(28344.8789, grad_fn=<MseLossBackward>)
output :  tensor([[188714.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4059595.2500, grad_fn=<MseLossBackward>)
output :  tensor([[162904.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4679e+10, grad_fn=<MseLossBackward>)
output :  tensor([[96822.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5036e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238944.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3087.1914, grad_fn=<MseLossBackward>)
output :  tensor([[178067.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4274168.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139198.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(643078.6875, grad_fn=<MseLossBackward>)
output :  tensor([[237858.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(8169771.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162435.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(318113.6250, grad_fn=<MseLossBackward>)
output :  tensor([[202720.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4952e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133310.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2853776.7500, grad_fn=<MseLossBackward>)
output :  tensor([[187578.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5424e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136775.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(601133.6875, grad_fn=<MseLossBackward>)
output :  tensor([[225591.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0834e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227947.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8632e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91079.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1166062.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160318.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(781953.3125, grad_fn=<MseLossBackward>)
output :  tensor([[247026.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5339e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149597.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(21139880., grad_fn=<MseLossBackward>)
output :  tensor([[107888.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6719e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164287.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(45209.3906, grad_fn=<MseLossBackward>)
output :  tensor([[148507.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(20315726., grad_fn=<MseLossBackward>)
output :  tensor([[128477.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(77171.1016, grad_fn=<MseLossBackward>)
output :  tensor([[190322.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7167e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124701.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4846602., grad_fn=<MseLossBackward>)
output :  tensor([[149843.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4650627., grad_fn=<MseLossBackward>)
output :  tensor([[167803.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(15573012., grad_fn=<MseLossBackward>)
output :  tensor([[152488.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2214609., grad_fn=<MseLossBackward>)
output :  tensor([[162078.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(674785.2500, grad_fn=<MseLossBackward>)
output :  tensor([[136084.]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3354e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133310.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1718270.3750, grad_fn=<MseLossBackward>)
output :  tensor([[154918.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5340e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145088.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(876359.2500, grad_fn=<MseLossBackward>)
output :  tensor([[163109.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1847773., grad_fn=<MseLossBackward>)
output :  tensor([[138421.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1350e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146498.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5297118., grad_fn=<MseLossBackward>)
output :  tensor([[184700.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(10885051., grad_fn=<MseLossBackward>)
output :  tensor([[168713.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(82091.2031, grad_fn=<MseLossBackward>)
output :  tensor([[181164.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1356715.3750, grad_fn=<MseLossBackward>)
output :  tensor([[220457.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(209063.2812, grad_fn=<MseLossBackward>)
output :  tensor([[111281.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(11432059., grad_fn=<MseLossBackward>)
output :  tensor([[137788.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6612e+08, grad_fn=<MseLossBackward>)
output :  tensor([[290428.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(19609952., grad_fn=<MseLossBackward>)
output :  tensor([[119820.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(14595862., grad_fn=<MseLossBackward>)
output :  tensor([[177185.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8331e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181861.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(9849986., grad_fn=<MseLossBackward>)
output :  tensor([[184288.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1468716.7500, grad_fn=<MseLossBackward>)
output :  tensor([[252016.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2825e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219509.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6200644.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128680.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1893e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174729.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7216e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124929.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(864144.5625, grad_fn=<MseLossBackward>)
output :  tensor([[183917.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4955e+10, grad_fn=<MseLossBackward>)
output :  tensor([[155485.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6178875.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153933.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(55258084., grad_fn=<MseLossBackward>)
output :  tensor([[206282.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(300.2639, grad_fn=<MseLossBackward>)
output :  tensor([[146198.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8765e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176243.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(59086.9766, grad_fn=<MseLossBackward>)
output :  tensor([[253132.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9526e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147662.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(113674.3359, grad_fn=<MseLossBackward>)
output :  tensor([[201286.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1900693., grad_fn=<MseLossBackward>)
output :  tensor([[163163.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(10329495., grad_fn=<MseLossBackward>)
output :  tensor([[123138.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2347e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130943.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(23106198., grad_fn=<MseLossBackward>)
output :  tensor([[181472.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6387229.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194036.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(16291062., grad_fn=<MseLossBackward>)
output :  tensor([[229644.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5230e+09, grad_fn=<MseLossBackward>)
output :  tensor([[257442.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(195764.7656, grad_fn=<MseLossBackward>)
output :  tensor([[184763.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8019e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144401.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7986e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148795.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(18448368., grad_fn=<MseLossBackward>)
output :  tensor([[70930.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5672e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140112.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(26133822., grad_fn=<MseLossBackward>)
output :  tensor([[129996.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(1203117.6250, grad_fn=<MseLossBackward>)
output :  tensor([[153374.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(390761.7188, grad_fn=<MseLossBackward>)
output :  tensor([[127283.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(80283.6797, grad_fn=<MseLossBackward>)
output :  tensor([[77516.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(1033987.1250, grad_fn=<MseLossBackward>)
output :  tensor([[83330.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(1770417.3750, grad_fn=<MseLossBackward>)
output :  tensor([[220281.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3732e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141166.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2176e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129757.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(551178.6250, grad_fn=<MseLossBackward>)
output :  tensor([[167061.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3766.8906, grad_fn=<MseLossBackward>)
output :  tensor([[232726.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5168589., grad_fn=<MseLossBackward>)
output :  tensor([[186239.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(34814240., grad_fn=<MseLossBackward>)
output :  tensor([[156126.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(15895.6934, grad_fn=<MseLossBackward>)
output :  tensor([[197275.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(389395.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202287.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2050e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137698.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(488164.2188, grad_fn=<MseLossBackward>)
output :  tensor([[157143.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4595329., grad_fn=<MseLossBackward>)
output :  tensor([[135492.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(257429.3906, grad_fn=<MseLossBackward>)
output :  tensor([[197140.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0798e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158870.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(23720552., grad_fn=<MseLossBackward>)
output :  tensor([[135440.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7590e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144823.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5883.3691, grad_fn=<MseLossBackward>)
output :  tensor([[203559.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(71235976., grad_fn=<MseLossBackward>)
output :  tensor([[104389.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0127e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167385.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(13035.2168, grad_fn=<MseLossBackward>)
output :  tensor([[128731.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(535572.3750, grad_fn=<MseLossBackward>)
output :  tensor([[146003.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(992514.0625, grad_fn=<MseLossBackward>)
output :  tensor([[102572.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6152e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137730.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(53187.8906, grad_fn=<MseLossBackward>)
output :  tensor([[238090.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4371039.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144066.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(871714., grad_fn=<MseLossBackward>)
output :  tensor([[139517.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4069360.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166518.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4836e+09, grad_fn=<MseLossBackward>)
output :  tensor([[265577.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5433e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172218.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7738481., grad_fn=<MseLossBackward>)
output :  tensor([[105744.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(8811899., grad_fn=<MseLossBackward>)
output :  tensor([[202094.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6860e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159734.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(540087.1875, grad_fn=<MseLossBackward>)
output :  tensor([[163796.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5638e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97096.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(1447679., grad_fn=<MseLossBackward>)
output :  tensor([[121725.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(3512842.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153148.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8132567., grad_fn=<MseLossBackward>)
output :  tensor([[142724.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7423666.5000, grad_fn=<MseLossBackward>)
output :  tensor([[199669.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(109509.2891, grad_fn=<MseLossBackward>)
output :  tensor([[142199.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(39825.1914, grad_fn=<MseLossBackward>)
output :  tensor([[257676.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(21195666., grad_fn=<MseLossBackward>)
output :  tensor([[127211.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1704e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163263.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5002701., grad_fn=<MseLossBackward>)
output :  tensor([[189657.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1339806.2500, grad_fn=<MseLossBackward>)
output :  tensor([[124872.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2118e+08, grad_fn=<MseLossBackward>)
output :  tensor([[248637.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1855342., grad_fn=<MseLossBackward>)
output :  tensor([[158101.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3514e+08, grad_fn=<MseLossBackward>)
output :  tensor([[240684.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(21770826., grad_fn=<MseLossBackward>)
output :  tensor([[146394.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5735351.5000, grad_fn=<MseLossBackward>)
output :  tensor([[209542.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(209320.5469, grad_fn=<MseLossBackward>)
output :  tensor([[173575.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1381873.7500, grad_fn=<MseLossBackward>)
output :  tensor([[154758.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(575108.9375, grad_fn=<MseLossBackward>)
output :  tensor([[117749.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(62550.7930, grad_fn=<MseLossBackward>)
output :  tensor([[235457.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6659e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237835.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4686548.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152967.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(136472.5156, grad_fn=<MseLossBackward>)
output :  tensor([[255557.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(431977.5625, grad_fn=<MseLossBackward>)
output :  tensor([[124624.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0243e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180111.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(16908030., grad_fn=<MseLossBackward>)
output :  tensor([[162321.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5390740.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128856.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4596066., grad_fn=<MseLossBackward>)
output :  tensor([[194756.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2584e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166742.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7523449., grad_fn=<MseLossBackward>)
output :  tensor([[163476.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(227067.1406, grad_fn=<MseLossBackward>)
output :  tensor([[157733.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(70789.2500, grad_fn=<MseLossBackward>)
output :  tensor([[150973.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1152301.6250, grad_fn=<MseLossBackward>)
output :  tensor([[174857.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2716e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159996.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(13.1406, grad_fn=<MseLossBackward>)
output :  tensor([[373921.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0096e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134676.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(58928652., grad_fn=<MseLossBackward>)
output :  tensor([[128635.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8607e+09, grad_fn=<MseLossBackward>)
output :  tensor([[276430.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(22868420., grad_fn=<MseLossBackward>)
output :  tensor([[159041.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8754386., grad_fn=<MseLossBackward>)
output :  tensor([[131314.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1695e+08, grad_fn=<MseLossBackward>)
output :  tensor([[242816.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1700e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174491.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(36096816., grad_fn=<MseLossBackward>)
output :  tensor([[154200.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4842406.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147124.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4514894.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154004.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9257e+08, grad_fn=<MseLossBackward>)
output :  tensor([[103417.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(11678025., grad_fn=<MseLossBackward>)
output :  tensor([[78267.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3371e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165219.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(48351.8867, grad_fn=<MseLossBackward>)
output :  tensor([[187595.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6325e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160546.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6484185., grad_fn=<MseLossBackward>)
output :  tensor([[163665.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(38013584., grad_fn=<MseLossBackward>)
output :  tensor([[139089.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2688370.2500, grad_fn=<MseLossBackward>)
output :  tensor([[211145.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(26994844., grad_fn=<MseLossBackward>)
output :  tensor([[140341.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5482695.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183912.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5898e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145328.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(450828.3125, grad_fn=<MseLossBackward>)
output :  tensor([[111918.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3630e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96509.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(6299355., grad_fn=<MseLossBackward>)
output :  tensor([[174542.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(209535.0625, grad_fn=<MseLossBackward>)
output :  tensor([[264131.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(13921061., grad_fn=<MseLossBackward>)
output :  tensor([[140766.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(537816., grad_fn=<MseLossBackward>)
output :  tensor([[161688.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3215857.7500, grad_fn=<MseLossBackward>)
output :  tensor([[134479.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3918729.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143252.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(39033796., grad_fn=<MseLossBackward>)
output :  tensor([[170615.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7375468., grad_fn=<MseLossBackward>)
output :  tensor([[128153.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(1330291.8750, grad_fn=<MseLossBackward>)
output :  tensor([[173412.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0730e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156364.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(404456.2500, grad_fn=<MseLossBackward>)
output :  tensor([[117070.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(325479.1562, grad_fn=<MseLossBackward>)
output :  tensor([[161581.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1006e+09, grad_fn=<MseLossBackward>)
output :  tensor([[47720.6680]], grad_fn=<AddmmBackward>)
loss:  tensor(18312682., grad_fn=<MseLossBackward>)
output :  tensor([[229479.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8923e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200879.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(14557.9307, grad_fn=<MseLossBackward>)
output :  tensor([[183731.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1609488.6250, grad_fn=<MseLossBackward>)
output :  tensor([[106048.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2349.2197, grad_fn=<MseLossBackward>)
output :  tensor([[89978.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8870066., grad_fn=<MseLossBackward>)
output :  tensor([[139736.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(69514.6172, grad_fn=<MseLossBackward>)
output :  tensor([[221638.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2362e+09, grad_fn=<MseLossBackward>)
output :  tensor([[203746.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(14087589., grad_fn=<MseLossBackward>)
output :  tensor([[163960.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1080397.8750, grad_fn=<MseLossBackward>)
output :  tensor([[172821.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4969e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189433.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(320922.2500, grad_fn=<MseLossBackward>)
output :  tensor([[88171.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(1372357.3750, grad_fn=<MseLossBackward>)
output :  tensor([[140596.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(356222.4688, grad_fn=<MseLossBackward>)
output :  tensor([[114178.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(13534351., grad_fn=<MseLossBackward>)
output :  tensor([[148252.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5110e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173798.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8317e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194269.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1515e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179184.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(665779.5000, grad_fn=<MseLossBackward>)
output :  tensor([[98862.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5581997., grad_fn=<MseLossBackward>)
output :  tensor([[118439.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(882689.6250, grad_fn=<MseLossBackward>)
output :  tensor([[162106.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7933e+08, grad_fn=<MseLossBackward>)
output :  tensor([[201326.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1760763.1250, grad_fn=<MseLossBackward>)
output :  tensor([[143812.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(35091.8281, grad_fn=<MseLossBackward>)
train_loss: [2.611735e+09]
epoch_result tensor([0.])
output :  tensor([[161799.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(10888247., grad_fn=<MseLossBackward>)
output :  tensor([[121050.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(900645.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194881.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(462676.2812, grad_fn=<MseLossBackward>)
output :  tensor([[177839.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(704288.1250, grad_fn=<MseLossBackward>)
output :  tensor([[152946.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2769e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132727.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(22344676., grad_fn=<MseLossBackward>)
output :  tensor([[140377.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(387331.1875, grad_fn=<MseLossBackward>)
output :  tensor([[119707.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(500136.2500, grad_fn=<MseLossBackward>)
output :  tensor([[67428.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(79726904., grad_fn=<MseLossBackward>)
output :  tensor([[167279.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1638000., grad_fn=<MseLossBackward>)
output :  tensor([[142021.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4086778., grad_fn=<MseLossBackward>)
output :  tensor([[223456.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2381379.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169105.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(11123.6572, grad_fn=<MseLossBackward>)
output :  tensor([[252448.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7552964., grad_fn=<MseLossBackward>)
output :  tensor([[53552.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2095980., grad_fn=<MseLossBackward>)
output :  tensor([[161471.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8801e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179345.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(18883234., grad_fn=<MseLossBackward>)
output :  tensor([[156326.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(30254.2539, grad_fn=<MseLossBackward>)
output :  tensor([[276993.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3974416., grad_fn=<MseLossBackward>)
output :  tensor([[193480.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(12386550., grad_fn=<MseLossBackward>)
output :  tensor([[137150.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5817e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194926.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1098009.2500, grad_fn=<MseLossBackward>)
output :  tensor([[180984.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9285e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151984.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(969424.8750, grad_fn=<MseLossBackward>)
output :  tensor([[176669.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(44475768., grad_fn=<MseLossBackward>)
output :  tensor([[84610.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(623433.6250, grad_fn=<MseLossBackward>)
output :  tensor([[169441.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1857e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186185.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1404743.5000, grad_fn=<MseLossBackward>)
output :  tensor([[209571.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1094e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110674.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(455614.4688, grad_fn=<MseLossBackward>)
output :  tensor([[168530.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(6096424., grad_fn=<MseLossBackward>)
output :  tensor([[139272.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7688749., grad_fn=<MseLossBackward>)
output :  tensor([[129952.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(906348.6250, grad_fn=<MseLossBackward>)
output :  tensor([[121755.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5086505., grad_fn=<MseLossBackward>)
output :  tensor([[146853.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9120e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168531.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1453e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144581.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(26204002., grad_fn=<MseLossBackward>)
output :  tensor([[181676.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2811333.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144623.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(13132923., grad_fn=<MseLossBackward>)
output :  tensor([[106454.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7073e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134216.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5260e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130077.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(24228468., grad_fn=<MseLossBackward>)
output :  tensor([[137437.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0893e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220371.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(21423302., grad_fn=<MseLossBackward>)
output :  tensor([[131607.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(413228., grad_fn=<MseLossBackward>)
output :  tensor([[152829.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(14667105., grad_fn=<MseLossBackward>)
output :  tensor([[116065.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(16525686., grad_fn=<MseLossBackward>)
output :  tensor([[159795.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(41928.9609, grad_fn=<MseLossBackward>)
output :  tensor([[146799.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3233e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195042.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(9259564., grad_fn=<MseLossBackward>)
output :  tensor([[135068.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(383083.6250, grad_fn=<MseLossBackward>)
output :  tensor([[121325.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2826e+08, grad_fn=<MseLossBackward>)
output :  tensor([[232472.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2333876.7500, grad_fn=<MseLossBackward>)
output :  tensor([[166387.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2187e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162690.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(13616677., grad_fn=<MseLossBackward>)
output :  tensor([[204031.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8382e+10, grad_fn=<MseLossBackward>)
output :  tensor([[246275.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1605e+10, grad_fn=<MseLossBackward>)
output :  tensor([[140923.]], grad_fn=<AddmmBackward>)
loss:  tensor(6640929., grad_fn=<MseLossBackward>)
output :  tensor([[134526.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(276971.9688, grad_fn=<MseLossBackward>)
output :  tensor([[158107.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(9655585., grad_fn=<MseLossBackward>)
output :  tensor([[135593.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(31292486., grad_fn=<MseLossBackward>)
output :  tensor([[181433.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1727e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181386.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7361641., grad_fn=<MseLossBackward>)
output :  tensor([[158652.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(8108256., grad_fn=<MseLossBackward>)
output :  tensor([[151785.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(77184464., grad_fn=<MseLossBackward>)
output :  tensor([[142177.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(104298.7188, grad_fn=<MseLossBackward>)
output :  tensor([[140631.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(19086660., grad_fn=<MseLossBackward>)
output :  tensor([[172010.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5800e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193663.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4459e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140698.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(17623728., grad_fn=<MseLossBackward>)
output :  tensor([[173197.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1682614.3750, grad_fn=<MseLossBackward>)
output :  tensor([[178533.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6083776.5000, grad_fn=<MseLossBackward>)
output :  tensor([[115566.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(320913.4062, grad_fn=<MseLossBackward>)
output :  tensor([[218589.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5808250.5000, grad_fn=<MseLossBackward>)
output :  tensor([[188452.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(24526792., grad_fn=<MseLossBackward>)
output :  tensor([[124785.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(510030.3125, grad_fn=<MseLossBackward>)
output :  tensor([[197028.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(279328.7812, grad_fn=<MseLossBackward>)
output :  tensor([[177604.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7315588., grad_fn=<MseLossBackward>)
output :  tensor([[206113.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2449e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209732.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1607546.6250, grad_fn=<MseLossBackward>)
output :  tensor([[166957.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2930e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193657.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(709832.5625, grad_fn=<MseLossBackward>)
output :  tensor([[111298.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2896006.2500, grad_fn=<MseLossBackward>)
output :  tensor([[115235.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(7480695., grad_fn=<MseLossBackward>)
output :  tensor([[112993.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(986747.3125, grad_fn=<MseLossBackward>)
output :  tensor([[147847.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1097616.3750, grad_fn=<MseLossBackward>)
output :  tensor([[160831.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3055e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177654.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5503569.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129659.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4665330., grad_fn=<MseLossBackward>)
output :  tensor([[144297.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(493462.3438, grad_fn=<MseLossBackward>)
output :  tensor([[187701.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7880e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118663.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(3108802.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198218.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1484628., grad_fn=<MseLossBackward>)
output :  tensor([[145302.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(91402.2969, grad_fn=<MseLossBackward>)
output :  tensor([[212051.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(720217.4375, grad_fn=<MseLossBackward>)
output :  tensor([[126992.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(984715.1250, grad_fn=<MseLossBackward>)
output :  tensor([[243797.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(20529678., grad_fn=<MseLossBackward>)
output :  tensor([[236165.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3848e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147748.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6726e+08, grad_fn=<MseLossBackward>)
output :  tensor([[86158.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3294e+08, grad_fn=<MseLossBackward>)
output :  tensor([[192338.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8164e+09, grad_fn=<MseLossBackward>)
output :  tensor([[81386.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(149370.1719, grad_fn=<MseLossBackward>)
output :  tensor([[138598.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(812392.3750, grad_fn=<MseLossBackward>)
output :  tensor([[76744.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(1548566.3750, grad_fn=<MseLossBackward>)
output :  tensor([[143282.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(108487.8906, grad_fn=<MseLossBackward>)
output :  tensor([[173322.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7168588., grad_fn=<MseLossBackward>)
output :  tensor([[152642.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(735520.6250, grad_fn=<MseLossBackward>)
output :  tensor([[106994.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(164791.5938, grad_fn=<MseLossBackward>)
output :  tensor([[203372.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2629e+10, grad_fn=<MseLossBackward>)
output :  tensor([[128634.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(17989.5156, grad_fn=<MseLossBackward>)
output :  tensor([[270242.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(95211248., grad_fn=<MseLossBackward>)
output :  tensor([[300584.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(88658704., grad_fn=<MseLossBackward>)
output :  tensor([[108325.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(681772.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169557.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8660513., grad_fn=<MseLossBackward>)
output :  tensor([[134406.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9730e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146171.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(51429740., grad_fn=<MseLossBackward>)
output :  tensor([[132999.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7557087., grad_fn=<MseLossBackward>)
output :  tensor([[127889.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8350113., grad_fn=<MseLossBackward>)
output :  tensor([[134679.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3401e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225073.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9175e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187176.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3662e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145364.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2144028., grad_fn=<MseLossBackward>)
output :  tensor([[134071.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(43185844., grad_fn=<MseLossBackward>)
output :  tensor([[109192.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(4232759.5000, grad_fn=<MseLossBackward>)
output :  tensor([[252297.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3249e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136115.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1244410., grad_fn=<MseLossBackward>)
output :  tensor([[203644.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(415219.1250, grad_fn=<MseLossBackward>)
output :  tensor([[104854.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2113.1260, grad_fn=<MseLossBackward>)
output :  tensor([[139963.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(175.9768, grad_fn=<MseLossBackward>)
output :  tensor([[207654.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8376e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180385.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(235634.3906, grad_fn=<MseLossBackward>)
output :  tensor([[185500.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(250125.0156, grad_fn=<MseLossBackward>)
output :  tensor([[162351.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1506e+10, grad_fn=<MseLossBackward>)
output :  tensor([[294648.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6282e+09, grad_fn=<MseLossBackward>)
output :  tensor([[198088.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(35385.1367, grad_fn=<MseLossBackward>)
output :  tensor([[257716.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1067e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221375.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9914e+09, grad_fn=<MseLossBackward>)
output :  tensor([[278539.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4792e+09, grad_fn=<MseLossBackward>)
output :  tensor([[222729.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1614964.3750, grad_fn=<MseLossBackward>)
output :  tensor([[222334.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8786e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194633.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5601579.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159536.]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3245e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134065.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2451524.2500, grad_fn=<MseLossBackward>)
output :  tensor([[133406.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4384639.5000, grad_fn=<MseLossBackward>)
output :  tensor([[94583.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(12840240., grad_fn=<MseLossBackward>)
output :  tensor([[103143.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(23581874., grad_fn=<MseLossBackward>)
output :  tensor([[271051.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3465e+09, grad_fn=<MseLossBackward>)
output :  tensor([[234600.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(159263.3438, grad_fn=<MseLossBackward>)
output :  tensor([[146904.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3625275.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135469.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4122676.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174793.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1124362., grad_fn=<MseLossBackward>)
output :  tensor([[144316.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(871218.0625, grad_fn=<MseLossBackward>)
output :  tensor([[166493.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8438e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165657.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(432429.5312, grad_fn=<MseLossBackward>)
output :  tensor([[138135.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1289431.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188228.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3203e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111298.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(491510.5312, grad_fn=<MseLossBackward>)
output :  tensor([[171874.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(15809.1328, grad_fn=<MseLossBackward>)
output :  tensor([[118922.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(1161629.2500, grad_fn=<MseLossBackward>)
output :  tensor([[85716.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1647011.2500, grad_fn=<MseLossBackward>)
output :  tensor([[178282.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2950557.7500, grad_fn=<MseLossBackward>)
output :  tensor([[110986.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(1180431.3750, grad_fn=<MseLossBackward>)
output :  tensor([[234773.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(17864226., grad_fn=<MseLossBackward>)
output :  tensor([[246016.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1032795.8125, grad_fn=<MseLossBackward>)
output :  tensor([[135569.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(36844712., grad_fn=<MseLossBackward>)
output :  tensor([[110213.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1574201.5000, grad_fn=<MseLossBackward>)
output :  tensor([[289286.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1865e+10, grad_fn=<MseLossBackward>)
output :  tensor([[172531.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1064669.2500, grad_fn=<MseLossBackward>)
output :  tensor([[120792.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(17704502., grad_fn=<MseLossBackward>)
output :  tensor([[143364.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4336e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199944.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9757e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139807.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1422727.1250, grad_fn=<MseLossBackward>)
output :  tensor([[158135.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4851e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150738.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9993699., grad_fn=<MseLossBackward>)
output :  tensor([[130860.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(1851704.3750, grad_fn=<MseLossBackward>)
output :  tensor([[245498.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7689e+10, grad_fn=<MseLossBackward>)
output :  tensor([[401031.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(938113.3125, grad_fn=<MseLossBackward>)
output :  tensor([[121247.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5001e+08, grad_fn=<MseLossBackward>)
output :  tensor([[116288.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4892183.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157356.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4592918., grad_fn=<MseLossBackward>)
output :  tensor([[131364.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1237e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161817.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6220e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174400.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1475e+09, grad_fn=<MseLossBackward>)
output :  tensor([[104037.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(191775.5625, grad_fn=<MseLossBackward>)
output :  tensor([[139522.]], grad_fn=<AddmmBackward>)
loss:  tensor(2184484., grad_fn=<MseLossBackward>)
output :  tensor([[361899.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(29101642., grad_fn=<MseLossBackward>)
output :  tensor([[205388.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3630e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174589.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(829750.1875, grad_fn=<MseLossBackward>)
output :  tensor([[205310.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5812318.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138154.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(715530.9375, grad_fn=<MseLossBackward>)
output :  tensor([[193797.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(493330.6250, grad_fn=<MseLossBackward>)
output :  tensor([[134720.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4095e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180382.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(381248.3750, grad_fn=<MseLossBackward>)
output :  tensor([[240969.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1062896.6250, grad_fn=<MseLossBackward>)
output :  tensor([[176219.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4928053., grad_fn=<MseLossBackward>)
output :  tensor([[110588.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(6702718.5000, grad_fn=<MseLossBackward>)
output :  tensor([[264574.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(177.2227, grad_fn=<MseLossBackward>)
output :  tensor([[256088.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(37067928., grad_fn=<MseLossBackward>)
output :  tensor([[125109.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(4451803.5000, grad_fn=<MseLossBackward>)
output :  tensor([[215221.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5734e+09, grad_fn=<MseLossBackward>)
output :  tensor([[306069.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6981e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207573.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(328472.2500, grad_fn=<MseLossBackward>)
output :  tensor([[214692.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5702e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158626.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(527393.6875, grad_fn=<MseLossBackward>)
output :  tensor([[167504.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6177011., grad_fn=<MseLossBackward>)
output :  tensor([[161268.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(18807130., grad_fn=<MseLossBackward>)
output :  tensor([[173542.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(12549638., grad_fn=<MseLossBackward>)
output :  tensor([[235235.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0735e+09, grad_fn=<MseLossBackward>)
output :  tensor([[219468.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(99752968., grad_fn=<MseLossBackward>)
output :  tensor([[161151.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0028e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127482.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(20093646., grad_fn=<MseLossBackward>)
output :  tensor([[176169.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(689366.9375, grad_fn=<MseLossBackward>)
output :  tensor([[180606.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3033e+09, grad_fn=<MseLossBackward>)
output :  tensor([[207112.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5158e+10, grad_fn=<MseLossBackward>)
output :  tensor([[137570.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(9852536., grad_fn=<MseLossBackward>)
output :  tensor([[151097.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7011e+08, grad_fn=<MseLossBackward>)
output :  tensor([[272719.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(18321878., grad_fn=<MseLossBackward>)
output :  tensor([[89579.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(20971248., grad_fn=<MseLossBackward>)
output :  tensor([[237429.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(864173.5625, grad_fn=<MseLossBackward>)
output :  tensor([[254980.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0755e+11, grad_fn=<MseLossBackward>)
output :  tensor([[169236.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(583194.7500, grad_fn=<MseLossBackward>)
output :  tensor([[193965.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6838e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154206.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(630386.3750, grad_fn=<MseLossBackward>)
output :  tensor([[205505.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1595e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128628.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(137936.7969, grad_fn=<MseLossBackward>)
output :  tensor([[146152.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1328544.3750, grad_fn=<MseLossBackward>)
output :  tensor([[171740.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5501e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184991.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(736780.8125, grad_fn=<MseLossBackward>)
output :  tensor([[132994.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(48924996., grad_fn=<MseLossBackward>)
output :  tensor([[139754.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(10592177., grad_fn=<MseLossBackward>)
output :  tensor([[168853.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(17190094., grad_fn=<MseLossBackward>)
output :  tensor([[201750.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3280e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237121.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(34552536., grad_fn=<MseLossBackward>)
output :  tensor([[154990.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(81.8459, grad_fn=<MseLossBackward>)
output :  tensor([[197309.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1714994.8750, grad_fn=<MseLossBackward>)
output :  tensor([[165318.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5447e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171782.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(59565352., grad_fn=<MseLossBackward>)
output :  tensor([[182559.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7075184.5000, grad_fn=<MseLossBackward>)
output :  tensor([[94273.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(7436230.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172059.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1651e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135952.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(908000.5625, grad_fn=<MseLossBackward>)
output :  tensor([[121246.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(39022668., grad_fn=<MseLossBackward>)
output :  tensor([[170929.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(9425092., grad_fn=<MseLossBackward>)
output :  tensor([[91242.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(38974560., grad_fn=<MseLossBackward>)
output :  tensor([[281181.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(77767048., grad_fn=<MseLossBackward>)
output :  tensor([[171010.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(36122352., grad_fn=<MseLossBackward>)
output :  tensor([[194904.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9117e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243317.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6633e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148436.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(6569770., grad_fn=<MseLossBackward>)
output :  tensor([[121952.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(4193504., grad_fn=<MseLossBackward>)
output :  tensor([[119283.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(379648.5312, grad_fn=<MseLossBackward>)
output :  tensor([[149668.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2019e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172999.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1000343.7500, grad_fn=<MseLossBackward>)
output :  tensor([[114155.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0020e+09, grad_fn=<MseLossBackward>)
output :  tensor([[212071.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1221e+10, grad_fn=<MseLossBackward>)
output :  tensor([[232489.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(81191360., grad_fn=<MseLossBackward>)
output :  tensor([[249887.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1113e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221753.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9744e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196517.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4157e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186564.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(874458.7500, grad_fn=<MseLossBackward>)
output :  tensor([[209420.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6418e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191687.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0826e+10, grad_fn=<MseLossBackward>)
output :  tensor([[175387.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(11239675., grad_fn=<MseLossBackward>)
output :  tensor([[153843.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3399644.5000, grad_fn=<MseLossBackward>)
output :  tensor([[332879.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(16978778., grad_fn=<MseLossBackward>)
output :  tensor([[213686.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2843966., grad_fn=<MseLossBackward>)
output :  tensor([[161195.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1428697.2500, grad_fn=<MseLossBackward>)
output :  tensor([[186556.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0188e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106617.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(2617797.5000, grad_fn=<MseLossBackward>)
output :  tensor([[275707.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8004e+10, grad_fn=<MseLossBackward>)
output :  tensor([[168681.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(27233068., grad_fn=<MseLossBackward>)
output :  tensor([[218149.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(21614218., grad_fn=<MseLossBackward>)
output :  tensor([[208018.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6851e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180033.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(695060.8750, grad_fn=<MseLossBackward>)
output :  tensor([[198837.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(8773537., grad_fn=<MseLossBackward>)
output :  tensor([[158705.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(13730267., grad_fn=<MseLossBackward>)
output :  tensor([[147964.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3006e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118220.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(78142.0859, grad_fn=<MseLossBackward>)
output :  tensor([[143234.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(10461182., grad_fn=<MseLossBackward>)
output :  tensor([[151313.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5352210., grad_fn=<MseLossBackward>)
output :  tensor([[201087.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6107e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161016.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2299440.5000, grad_fn=<MseLossBackward>)
output :  tensor([[102170.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(7130694., grad_fn=<MseLossBackward>)
output :  tensor([[227521.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5572e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184557.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6318e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176745.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(67665.0156, grad_fn=<MseLossBackward>)
output :  tensor([[79408.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6714819.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131250.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7564390.5000, grad_fn=<MseLossBackward>)
output :  tensor([[219580.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(31143724., grad_fn=<MseLossBackward>)
output :  tensor([[143188.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(658430.8125, grad_fn=<MseLossBackward>)
output :  tensor([[133561.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(12682168., grad_fn=<MseLossBackward>)
output :  tensor([[145836.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(10475033., grad_fn=<MseLossBackward>)
output :  tensor([[177538.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6031e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147020.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9124553., grad_fn=<MseLossBackward>)
output :  tensor([[160235.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(55394.0352, grad_fn=<MseLossBackward>)
output :  tensor([[212127.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(8254039., grad_fn=<MseLossBackward>)
output :  tensor([[137760.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0733e+09, grad_fn=<MseLossBackward>)
output :  tensor([[258523.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(12412630., grad_fn=<MseLossBackward>)
output :  tensor([[156923.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6639962.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128360.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(19351.4180, grad_fn=<MseLossBackward>)
output :  tensor([[96008.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(1016741.3750, grad_fn=<MseLossBackward>)
output :  tensor([[152403.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6109e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181680.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3170959.2500, grad_fn=<MseLossBackward>)
output :  tensor([[120692.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(36939.0391, grad_fn=<MseLossBackward>)
output :  tensor([[187037.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7567e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144796.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2637e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150572.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(452907.9688, grad_fn=<MseLossBackward>)
output :  tensor([[186231.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2306601.5000, grad_fn=<MseLossBackward>)
output :  tensor([[251484.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7300e+09, grad_fn=<MseLossBackward>)
output :  tensor([[91933.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(188213.6250, grad_fn=<MseLossBackward>)
output :  tensor([[240199.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(39706.7891, grad_fn=<MseLossBackward>)
output :  tensor([[128738.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(56725.8438, grad_fn=<MseLossBackward>)
output :  tensor([[164877.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0206e+10, grad_fn=<MseLossBackward>)
output :  tensor([[113768.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8958e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179948.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(15591393., grad_fn=<MseLossBackward>)
output :  tensor([[165139.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6251e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155859.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4310e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236730.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5150488.5000, grad_fn=<MseLossBackward>)
output :  tensor([[226924.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6566e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125966.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(1068622.8750, grad_fn=<MseLossBackward>)
output :  tensor([[129822.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(14611566., grad_fn=<MseLossBackward>)
output :  tensor([[222293.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(22152172., grad_fn=<MseLossBackward>)
output :  tensor([[230007.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(15942676., grad_fn=<MseLossBackward>)
output :  tensor([[224320.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5660607.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144858.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(9869415., grad_fn=<MseLossBackward>)
output :  tensor([[202108.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(62279964., grad_fn=<MseLossBackward>)
output :  tensor([[130015.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0031e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133288.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(622003.3125, grad_fn=<MseLossBackward>)
output :  tensor([[311407.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(12903138., grad_fn=<MseLossBackward>)
output :  tensor([[142557.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2426828.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120712.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8850e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110741.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1542175.8750, grad_fn=<MseLossBackward>)
output :  tensor([[155321.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9511e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181385.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7123e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176474.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(12068785., grad_fn=<MseLossBackward>)
output :  tensor([[192281.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(76010336., grad_fn=<MseLossBackward>)
output :  tensor([[104362.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(19035292., grad_fn=<MseLossBackward>)
output :  tensor([[177581.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2013516.6250, grad_fn=<MseLossBackward>)
output :  tensor([[168753.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(728995.8125, grad_fn=<MseLossBackward>)
output :  tensor([[134726.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(18265740., grad_fn=<MseLossBackward>)
output :  tensor([[260392.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7432e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141956.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2440e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172665.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(112057.5625, grad_fn=<MseLossBackward>)
output :  tensor([[141050.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1103025., grad_fn=<MseLossBackward>)
output :  tensor([[200132.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(135309.0312, grad_fn=<MseLossBackward>)
output :  tensor([[167971.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4113037.5000, grad_fn=<MseLossBackward>)
output :  tensor([[243137.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(743717.5625, grad_fn=<MseLossBackward>)
output :  tensor([[133440.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1122474., grad_fn=<MseLossBackward>)
output :  tensor([[151039.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2855255., grad_fn=<MseLossBackward>)
output :  tensor([[212910.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4364117., grad_fn=<MseLossBackward>)
output :  tensor([[166152.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1328940.6250, grad_fn=<MseLossBackward>)
output :  tensor([[191681.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7192872.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132648.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9439e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128030.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(940127.1875, grad_fn=<MseLossBackward>)
output :  tensor([[141546.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2392290.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202727.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4586e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166171.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6185e+09, grad_fn=<MseLossBackward>)
output :  tensor([[76476.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7147e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92359.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(61778372., grad_fn=<MseLossBackward>)
output :  tensor([[248148.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(26469256., grad_fn=<MseLossBackward>)
output :  tensor([[203629.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1770e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113974.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(1051730.3750, grad_fn=<MseLossBackward>)
output :  tensor([[160921.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0639e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206283.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8814e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178795.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3183e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157154.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4641601., grad_fn=<MseLossBackward>)
output :  tensor([[171986.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3946803., grad_fn=<MseLossBackward>)
output :  tensor([[119823.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(23264570., grad_fn=<MseLossBackward>)
output :  tensor([[163347.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(69684928., grad_fn=<MseLossBackward>)
output :  tensor([[191601.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3403e+08, grad_fn=<MseLossBackward>)
output :  tensor([[217426.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4300568.5000, grad_fn=<MseLossBackward>)
output :  tensor([[244982.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5002e+11, grad_fn=<MseLossBackward>)
output :  tensor([[146087.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(833454.8750, grad_fn=<MseLossBackward>)
output :  tensor([[109599.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(1253472.6250, grad_fn=<MseLossBackward>)
output :  tensor([[168811.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7131e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156637.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(37674468., grad_fn=<MseLossBackward>)
output :  tensor([[236861.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(19100.1035, grad_fn=<MseLossBackward>)
output :  tensor([[115208.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(43277., grad_fn=<MseLossBackward>)
output :  tensor([[185091.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4801371., grad_fn=<MseLossBackward>)
output :  tensor([[185814.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(784497.6875, grad_fn=<MseLossBackward>)
output :  tensor([[162645.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4760e+10, grad_fn=<MseLossBackward>)
output :  tensor([[95698.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1605e+08, grad_fn=<MseLossBackward>)
output :  tensor([[245034.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(36419152., grad_fn=<MseLossBackward>)
output :  tensor([[177454.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2114297.7500, grad_fn=<MseLossBackward>)
output :  tensor([[139402.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(356856.8750, grad_fn=<MseLossBackward>)
output :  tensor([[236515.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2295840.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166068.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(9414254., grad_fn=<MseLossBackward>)
output :  tensor([[203718.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4709e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133100.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3607922.2500, grad_fn=<MseLossBackward>)
output :  tensor([[185250.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4061e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133080.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(8522477., grad_fn=<MseLossBackward>)
output :  tensor([[226836.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(83976888., grad_fn=<MseLossBackward>)
output :  tensor([[223573.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9835e+08, grad_fn=<MseLossBackward>)
output :  tensor([[90198.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(39389.8438, grad_fn=<MseLossBackward>)
output :  tensor([[159453.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(398.1272, grad_fn=<MseLossBackward>)
output :  tensor([[243813.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6145e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146533.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2351478.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109291.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7886e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166265.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3115445.7500, grad_fn=<MseLossBackward>)
output :  tensor([[144962.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(926285.9375, grad_fn=<MseLossBackward>)
output :  tensor([[128693.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(243519.1250, grad_fn=<MseLossBackward>)
output :  tensor([[189397.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8445e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123231.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(534589.4375, grad_fn=<MseLossBackward>)
output :  tensor([[154507.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6289045., grad_fn=<MseLossBackward>)
output :  tensor([[170717.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1065282., grad_fn=<MseLossBackward>)
output :  tensor([[149366.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2667760.7500, grad_fn=<MseLossBackward>)
output :  tensor([[162753.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(21475.9863, grad_fn=<MseLossBackward>)
output :  tensor([[135854.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2115e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130985.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(1029479.7500, grad_fn=<MseLossBackward>)
output :  tensor([[154045.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2638e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144720.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(323138.9688, grad_fn=<MseLossBackward>)
output :  tensor([[161547.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(40822.9414, grad_fn=<MseLossBackward>)
output :  tensor([[137329.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5236e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148206.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(352520.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186633.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1868646.2500, grad_fn=<MseLossBackward>)
output :  tensor([[167709.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1665793.5000, grad_fn=<MseLossBackward>)
output :  tensor([[181752.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3071913.5000, grad_fn=<MseLossBackward>)
output :  tensor([[225068.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(25694602., grad_fn=<MseLossBackward>)
output :  tensor([[108181.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(79378.6641, grad_fn=<MseLossBackward>)
output :  tensor([[136382.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3185e+08, grad_fn=<MseLossBackward>)
output :  tensor([[283155.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(8093136., grad_fn=<MseLossBackward>)
output :  tensor([[119339.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(11155496., grad_fn=<MseLossBackward>)
output :  tensor([[174114.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1055e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190841.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(34124948., grad_fn=<MseLossBackward>)
output :  tensor([[186224.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(524243.8750, grad_fn=<MseLossBackward>)
output :  tensor([[252515.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0554e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220944.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1114707., grad_fn=<MseLossBackward>)
output :  tensor([[130750.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1754e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174615.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6723e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124679.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(461412.4062, grad_fn=<MseLossBackward>)
output :  tensor([[184259.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4781e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149881.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(9726407., grad_fn=<MseLossBackward>)
output :  tensor([[155510.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(81197560., grad_fn=<MseLossBackward>)
output :  tensor([[205321.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(958379.8125, grad_fn=<MseLossBackward>)
output :  tensor([[145023.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5685e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175777.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(49443.6914, grad_fn=<MseLossBackward>)
output :  tensor([[251341.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9288e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148362.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(131360.9375, grad_fn=<MseLossBackward>)
output :  tensor([[201047.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2617317.2500, grad_fn=<MseLossBackward>)
output :  tensor([[160722.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(596514.8750, grad_fn=<MseLossBackward>)
output :  tensor([[125912.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4373e+09, grad_fn=<MseLossBackward>)
output :  tensor([[140067.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(18644044., grad_fn=<MseLossBackward>)
output :  tensor([[182875.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1264394.8750, grad_fn=<MseLossBackward>)
output :  tensor([[194566.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(20849640., grad_fn=<MseLossBackward>)
output :  tensor([[222398.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4358e+09, grad_fn=<MseLossBackward>)
output :  tensor([[255060.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3762812., grad_fn=<MseLossBackward>)
output :  tensor([[186415.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7579e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145414.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9068e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145227.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(529620.0625, grad_fn=<MseLossBackward>)
output :  tensor([[74199.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1696e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128577.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(41242184., grad_fn=<MseLossBackward>)
output :  tensor([[127147.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3071256.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155258.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1582760.6250, grad_fn=<MseLossBackward>)
output :  tensor([[125005.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3976970.7500, grad_fn=<MseLossBackward>)
output :  tensor([[77729.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1510863.5000, grad_fn=<MseLossBackward>)
output :  tensor([[83620.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2625868.2500, grad_fn=<MseLossBackward>)
output :  tensor([[232293.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(86178.9375, grad_fn=<MseLossBackward>)
output :  tensor([[140778.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9968e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134171.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(13477962., grad_fn=<MseLossBackward>)
output :  tensor([[171161.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(17316392., grad_fn=<MseLossBackward>)
output :  tensor([[234148.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(725398.1875, grad_fn=<MseLossBackward>)
output :  tensor([[184911.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(52257312., grad_fn=<MseLossBackward>)
output :  tensor([[152692.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(10938729., grad_fn=<MseLossBackward>)
output :  tensor([[202590.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(21998298., grad_fn=<MseLossBackward>)
output :  tensor([[201798.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2392e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138755.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3082438.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152246.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(7583569.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133822.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4739397., grad_fn=<MseLossBackward>)
output :  tensor([[196832.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1001e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154823.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(677534.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138670.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0404e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147281.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5669607.5000, grad_fn=<MseLossBackward>)
output :  tensor([[206693.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(28163254., grad_fn=<MseLossBackward>)
output :  tensor([[104043.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8590e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167602.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(10471.0449, grad_fn=<MseLossBackward>)
output :  tensor([[126731.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1608775.1250, grad_fn=<MseLossBackward>)
output :  tensor([[147018.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(349.8069, grad_fn=<MseLossBackward>)
output :  tensor([[105858.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8901e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139422.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3695165.2500, grad_fn=<MseLossBackward>)
output :  tensor([[238432.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5919109., grad_fn=<MseLossBackward>)
output :  tensor([[146180.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1394502.6250, grad_fn=<MseLossBackward>)
output :  tensor([[138498.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(997470.3750, grad_fn=<MseLossBackward>)
output :  tensor([[163462.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2576e+09, grad_fn=<MseLossBackward>)
output :  tensor([[267959.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0080e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176234.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1523758.7500, grad_fn=<MseLossBackward>)
output :  tensor([[105996.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(10372526., grad_fn=<MseLossBackward>)
output :  tensor([[201301.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8062e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157115.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3551929.2500, grad_fn=<MseLossBackward>)
output :  tensor([[161592.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6584e+10, grad_fn=<MseLossBackward>)
output :  tensor([[98904.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(365665.8750, grad_fn=<MseLossBackward>)
output :  tensor([[123302.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(88394.7188, grad_fn=<MseLossBackward>)
output :  tensor([[158900.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(8410634., grad_fn=<MseLossBackward>)
output :  tensor([[139476.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(273757.8750, grad_fn=<MseLossBackward>)
output :  tensor([[199920.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6387.5059, grad_fn=<MseLossBackward>)
output :  tensor([[143030.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1061704.8750, grad_fn=<MseLossBackward>)
output :  tensor([[261773.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(256827.2344, grad_fn=<MseLossBackward>)
output :  tensor([[126266.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1067e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167893.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5726972.5000, grad_fn=<MseLossBackward>)
output :  tensor([[185847.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7034513., grad_fn=<MseLossBackward>)
output :  tensor([[122632.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5959e+08, grad_fn=<MseLossBackward>)
output :  tensor([[253434.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(11797293., grad_fn=<MseLossBackward>)
output :  tensor([[158680.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0197e+08, grad_fn=<MseLossBackward>)
output :  tensor([[241486.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(14927840., grad_fn=<MseLossBackward>)
output :  tensor([[146558.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6547841.5000, grad_fn=<MseLossBackward>)
output :  tensor([[210197.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(38895.2344, grad_fn=<MseLossBackward>)
output :  tensor([[174748.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5516480., grad_fn=<MseLossBackward>)
output :  tensor([[150858.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(9866372., grad_fn=<MseLossBackward>)
output :  tensor([[119458.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2126675.2500, grad_fn=<MseLossBackward>)
output :  tensor([[237087.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5002e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236639.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(11294746., grad_fn=<MseLossBackward>)
output :  tensor([[151896.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2074410.1250, grad_fn=<MseLossBackward>)
output :  tensor([[250841.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(16469900., grad_fn=<MseLossBackward>)
output :  tensor([[126296.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3907e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175441.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(311852.4375, grad_fn=<MseLossBackward>)
output :  tensor([[162115.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4476398., grad_fn=<MseLossBackward>)
output :  tensor([[132796.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3229152.7500, grad_fn=<MseLossBackward>)
output :  tensor([[192006.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9071e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163639.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(129757.5469, grad_fn=<MseLossBackward>)
output :  tensor([[161355.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2705048.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158664.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(441975.6562, grad_fn=<MseLossBackward>)
output :  tensor([[146958.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(8649941., grad_fn=<MseLossBackward>)
output :  tensor([[172043.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9117e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161046.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1095227.6250, grad_fn=<MseLossBackward>)
output :  tensor([[375199.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(76913448., grad_fn=<MseLossBackward>)
output :  tensor([[125722.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1632126., grad_fn=<MseLossBackward>)
output :  tensor([[128240.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8267e+09, grad_fn=<MseLossBackward>)
output :  tensor([[280445.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(589680., grad_fn=<MseLossBackward>)
output :  tensor([[162615.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(379436.7500, grad_fn=<MseLossBackward>)
output :  tensor([[132076.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3402e+08, grad_fn=<MseLossBackward>)
output :  tensor([[231565.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(189102.6719, grad_fn=<MseLossBackward>)
output :  tensor([[178254.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5042691.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151872.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(16240.3164, grad_fn=<MseLossBackward>)
output :  tensor([[142941.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4237229.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154012.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9282e+08, grad_fn=<MseLossBackward>)
output :  tensor([[101328.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(1764767., grad_fn=<MseLossBackward>)
output :  tensor([[76952.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8737e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165607.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(368657.6875, grad_fn=<MseLossBackward>)
output :  tensor([[186401.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7304e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158198.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(39334.0469, grad_fn=<MseLossBackward>)
output :  tensor([[160891.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(11501954., grad_fn=<MseLossBackward>)
output :  tensor([[137593.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(20542.9512, grad_fn=<MseLossBackward>)
output :  tensor([[204118.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3354564., grad_fn=<MseLossBackward>)
output :  tensor([[139370.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1878013.2500, grad_fn=<MseLossBackward>)
output :  tensor([[182840.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6169e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150971.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(24713482., grad_fn=<MseLossBackward>)
output :  tensor([[109784.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1740e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91112.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(8335355.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176488.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2216888.2500, grad_fn=<MseLossBackward>)
output :  tensor([[258766.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2668169., grad_fn=<MseLossBackward>)
output :  tensor([[142553.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1109006.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159482.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(170104.6875, grad_fn=<MseLossBackward>)
output :  tensor([[132692.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(36882.0039, grad_fn=<MseLossBackward>)
output :  tensor([[145998.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(12257767., grad_fn=<MseLossBackward>)
output :  tensor([[170040.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4580001.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129054.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(4218948., grad_fn=<MseLossBackward>)
output :  tensor([[172980.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8289e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158704.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2906865.2500, grad_fn=<MseLossBackward>)
output :  tensor([[115725.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(599801.8750, grad_fn=<MseLossBackward>)
output :  tensor([[162073.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0306e+09, grad_fn=<MseLossBackward>)
output :  tensor([[55005.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(9030729., grad_fn=<MseLossBackward>)
output :  tensor([[232893.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3372e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201979.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(960032.5625, grad_fn=<MseLossBackward>)
output :  tensor([[184302.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(486048.6250, grad_fn=<MseLossBackward>)
output :  tensor([[104679.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(1743575.8750, grad_fn=<MseLossBackward>)
output :  tensor([[89917.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(8511943., grad_fn=<MseLossBackward>)
output :  tensor([[141697.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2881665.5000, grad_fn=<MseLossBackward>)
output :  tensor([[220047.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4690e+09, grad_fn=<MseLossBackward>)
output :  tensor([[202986.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(20371824., grad_fn=<MseLossBackward>)
output :  tensor([[167241.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5025653., grad_fn=<MseLossBackward>)
output :  tensor([[173404.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3897e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190189.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(35833.3086, grad_fn=<MseLossBackward>)
output :  tensor([[88447.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2094080.3750, grad_fn=<MseLossBackward>)
output :  tensor([[137266.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7469716., grad_fn=<MseLossBackward>)
output :  tensor([[110151.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(121283.5078, grad_fn=<MseLossBackward>)
output :  tensor([[147282.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2819e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171640.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6516e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194688.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0634e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179532.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(218410.1875, grad_fn=<MseLossBackward>)
output :  tensor([[97950.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(2103565., grad_fn=<MseLossBackward>)
output :  tensor([[118384.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(782672., grad_fn=<MseLossBackward>)
output :  tensor([[160332.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6016e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196891.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(9664229., grad_fn=<MseLossBackward>)
output :  tensor([[144670.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(449276.9688, grad_fn=<MseLossBackward>)
train_loss: [2.6162772e+09]
epoch_result tensor([0.])
output :  tensor([[160623.]], grad_fn=<AddmmBackward>)
loss:  tensor(4507129., grad_fn=<MseLossBackward>)
output :  tensor([[122304.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(92696.4609, grad_fn=<MseLossBackward>)
output :  tensor([[195451.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1564883.7500, grad_fn=<MseLossBackward>)
output :  tensor([[176010.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(978924.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153044.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2279e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131931.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(15456201., grad_fn=<MseLossBackward>)
output :  tensor([[141228.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(52247.9609, grad_fn=<MseLossBackward>)
output :  tensor([[116629.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(5619752., grad_fn=<MseLossBackward>)
output :  tensor([[69462.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2017e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165040.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(920760.1875, grad_fn=<MseLossBackward>)
output :  tensor([[130684.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(86771992., grad_fn=<MseLossBackward>)
output :  tensor([[227076.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4313085.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166342.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(7064050.5000, grad_fn=<MseLossBackward>)
output :  tensor([[243529.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(38072564., grad_fn=<MseLossBackward>)
output :  tensor([[57731.7305]], grad_fn=<AddmmBackward>)
loss:  tensor(7462351.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161414.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8610e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171048.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(15617563., grad_fn=<MseLossBackward>)
output :  tensor([[171600.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2802e+08, grad_fn=<MseLossBackward>)
output :  tensor([[274979.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(438.3789, grad_fn=<MseLossBackward>)
output :  tensor([[198210.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1465915.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137853.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5431e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196160.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5204101.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179448.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0659e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152299.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1688172.3750, grad_fn=<MseLossBackward>)
output :  tensor([[173831.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(14681829., grad_fn=<MseLossBackward>)
output :  tensor([[86310.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(829508.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170922.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3550e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186579.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2494030.5000, grad_fn=<MseLossBackward>)
output :  tensor([[205491.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5008e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107228.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7683637.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171004.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(23.6135, grad_fn=<MseLossBackward>)
output :  tensor([[135774.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(526803.8125, grad_fn=<MseLossBackward>)
output :  tensor([[128918.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(6689.4507, grad_fn=<MseLossBackward>)
output :  tensor([[120744.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1549285.8750, grad_fn=<MseLossBackward>)
output :  tensor([[145902.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3536e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168023.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1602e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149314.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(148333.2969, grad_fn=<MseLossBackward>)
output :  tensor([[178085.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3666207.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142033.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1068736., grad_fn=<MseLossBackward>)
output :  tensor([[103731.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8856e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135039.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3937e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137608.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6804272., grad_fn=<MseLossBackward>)
output :  tensor([[129662.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7087658.5000, grad_fn=<MseLossBackward>)
output :  tensor([[225285.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(81501.3281, grad_fn=<MseLossBackward>)
output :  tensor([[132877.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(394325.1250, grad_fn=<MseLossBackward>)
output :  tensor([[150259.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1587009.3750, grad_fn=<MseLossBackward>)
output :  tensor([[110867.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(1282644.7500, grad_fn=<MseLossBackward>)
output :  tensor([[162032.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4132707.7500, grad_fn=<MseLossBackward>)
output :  tensor([[141980.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8111e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191083.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(840688.4375, grad_fn=<MseLossBackward>)
output :  tensor([[134113.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(113011.5312, grad_fn=<MseLossBackward>)
output :  tensor([[109636.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(132189.0469, grad_fn=<MseLossBackward>)
output :  tensor([[234850.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(722951.6250, grad_fn=<MseLossBackward>)
output :  tensor([[164817.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3690e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161991.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8947950., grad_fn=<MseLossBackward>)
output :  tensor([[203167.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8673e+10, grad_fn=<MseLossBackward>)
output :  tensor([[244667.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1954e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145224.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2972822.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133433.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(320922.2500, grad_fn=<MseLossBackward>)
output :  tensor([[152573.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5886765., grad_fn=<MseLossBackward>)
output :  tensor([[132137.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4568839.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179368.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5014e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182046.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4215322.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162727.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1507907.2500, grad_fn=<MseLossBackward>)
output :  tensor([[141211.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3199347., grad_fn=<MseLossBackward>)
output :  tensor([[145597.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(9596152., grad_fn=<MseLossBackward>)
output :  tensor([[149200.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(17640918., grad_fn=<MseLossBackward>)
output :  tensor([[175003.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1838e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193718.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4201e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139982.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(12130418., grad_fn=<MseLossBackward>)
output :  tensor([[170091.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3270502.7500, grad_fn=<MseLossBackward>)
output :  tensor([[176575.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(19578690., grad_fn=<MseLossBackward>)
output :  tensor([[115840.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(706466.5000, grad_fn=<MseLossBackward>)
output :  tensor([[221146.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(21508.0547, grad_fn=<MseLossBackward>)
output :  tensor([[181708.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3209304.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128354.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(8145762., grad_fn=<MseLossBackward>)
output :  tensor([[195953.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(298457.3438, grad_fn=<MseLossBackward>)
output :  tensor([[171709.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(10177795., grad_fn=<MseLossBackward>)
output :  tensor([[208057.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1752e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209415.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2510590.7500, grad_fn=<MseLossBackward>)
output :  tensor([[166360.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2504e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194164.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(112350.6562, grad_fn=<MseLossBackward>)
output :  tensor([[112256.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(552467., grad_fn=<MseLossBackward>)
output :  tensor([[115181.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7189353., grad_fn=<MseLossBackward>)
output :  tensor([[108946.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(9324578., grad_fn=<MseLossBackward>)
output :  tensor([[146281.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(268340.1875, grad_fn=<MseLossBackward>)
output :  tensor([[159197.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3652e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179303.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(484938.1250, grad_fn=<MseLossBackward>)
output :  tensor([[130274.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(7697937., grad_fn=<MseLossBackward>)
output :  tensor([[143162.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3377267.7500, grad_fn=<MseLossBackward>)
output :  tensor([[181662.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1867e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118844.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(3782690.7500, grad_fn=<MseLossBackward>)
output :  tensor([[196628.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(138116.7500, grad_fn=<MseLossBackward>)
output :  tensor([[144610.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(152087.8125, grad_fn=<MseLossBackward>)
output :  tensor([[212628.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(73797.1172, grad_fn=<MseLossBackward>)
output :  tensor([[128734.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(7479071., grad_fn=<MseLossBackward>)
output :  tensor([[245962.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5594629.5000, grad_fn=<MseLossBackward>)
output :  tensor([[238742.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1397e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146166.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1804e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85873.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1867e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194124.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5247e+09, grad_fn=<MseLossBackward>)
output :  tensor([[83076.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(4312014.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140029.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(280817.1875, grad_fn=<MseLossBackward>)
output :  tensor([[77090.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2529044.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144257.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1701068., grad_fn=<MseLossBackward>)
output :  tensor([[174500.]], grad_fn=<AddmmBackward>)
loss:  tensor(2250000., grad_fn=<MseLossBackward>)
output :  tensor([[154494.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(988843.8125, grad_fn=<MseLossBackward>)
output :  tensor([[109448.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(4195552., grad_fn=<MseLossBackward>)
output :  tensor([[203573.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2584e+10, grad_fn=<MseLossBackward>)
output :  tensor([[128290.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(43805.1836, grad_fn=<MseLossBackward>)
output :  tensor([[267096.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6651e+08, grad_fn=<MseLossBackward>)
output :  tensor([[303899.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(37212668., grad_fn=<MseLossBackward>)
output :  tensor([[108920.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(2017176.6250, grad_fn=<MseLossBackward>)
output :  tensor([[172106.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(154596.4062, grad_fn=<MseLossBackward>)
output :  tensor([[132383.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9455e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141523.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6370497., grad_fn=<MseLossBackward>)
output :  tensor([[131201.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(905857.8125, grad_fn=<MseLossBackward>)
output :  tensor([[125625.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(391348., grad_fn=<MseLossBackward>)
output :  tensor([[136342.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2053e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226024.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8799e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188036.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3398e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142051.]], grad_fn=<AddmmBackward>)
loss:  tensor(3418801., grad_fn=<MseLossBackward>)
output :  tensor([[131348.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(14808427., grad_fn=<MseLossBackward>)
output :  tensor([[113899.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7019850., grad_fn=<MseLossBackward>)
output :  tensor([[254641.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0220e+09, grad_fn=<MseLossBackward>)
output :  tensor([[132525.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6123537., grad_fn=<MseLossBackward>)
output :  tensor([[200112.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(8337476., grad_fn=<MseLossBackward>)
output :  tensor([[111591.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(44780980., grad_fn=<MseLossBackward>)
output :  tensor([[138613.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1786524.6250, grad_fn=<MseLossBackward>)
output :  tensor([[206546.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2233e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178598.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1692966.8750, grad_fn=<MseLossBackward>)
output :  tensor([[185218.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(47598.9688, grad_fn=<MseLossBackward>)
output :  tensor([[163166.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1267e+10, grad_fn=<MseLossBackward>)
output :  tensor([[301813.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1013e+09, grad_fn=<MseLossBackward>)
output :  tensor([[198494.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(353969.2188, grad_fn=<MseLossBackward>)
output :  tensor([[262151.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9799e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221374.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9914e+09, grad_fn=<MseLossBackward>)
output :  tensor([[281698.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2462e+09, grad_fn=<MseLossBackward>)
output :  tensor([[222884.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1245107.2500, grad_fn=<MseLossBackward>)
output :  tensor([[222385.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8769e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195627.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1884399.6250, grad_fn=<MseLossBackward>)
output :  tensor([[159249.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1506e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133514.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1029178.5625, grad_fn=<MseLossBackward>)
output :  tensor([[136174.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(454655.2188, grad_fn=<MseLossBackward>)
output :  tensor([[91457.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(209370.5938, grad_fn=<MseLossBackward>)
output :  tensor([[109080.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1166872.5000, grad_fn=<MseLossBackward>)
output :  tensor([[271982.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2396e+09, grad_fn=<MseLossBackward>)
output :  tensor([[234972.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(742.5625, grad_fn=<MseLossBackward>)
output :  tensor([[146221.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1491642.3750, grad_fn=<MseLossBackward>)
output :  tensor([[139262.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3105690.2500, grad_fn=<MseLossBackward>)
output :  tensor([[172995.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(543837.1250, grad_fn=<MseLossBackward>)
output :  tensor([[147414.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4683369.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165732.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2758e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166475.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2175993.7500, grad_fn=<MseLossBackward>)
output :  tensor([[137325.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(105919.7344, grad_fn=<MseLossBackward>)
output :  tensor([[187772.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2605e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113716.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2947928., grad_fn=<MseLossBackward>)
output :  tensor([[177785.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(33466768., grad_fn=<MseLossBackward>)
output :  tensor([[118989.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1021410.2500, grad_fn=<MseLossBackward>)
output :  tensor([[85316.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(2835408.7500, grad_fn=<MseLossBackward>)
output :  tensor([[180608.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(370519.5000, grad_fn=<MseLossBackward>)
output :  tensor([[113948.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(16394148., grad_fn=<MseLossBackward>)
output :  tensor([[239579.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(336128.1875, grad_fn=<MseLossBackward>)
output :  tensor([[245194.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(37739.1328, grad_fn=<MseLossBackward>)
output :  tensor([[131116.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2613577.5000, grad_fn=<MseLossBackward>)
output :  tensor([[105586.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(11375126., grad_fn=<MseLossBackward>)
output :  tensor([[290166.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1605e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174336.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(8048303., grad_fn=<MseLossBackward>)
output :  tensor([[126051.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1105948., grad_fn=<MseLossBackward>)
output :  tensor([[143525.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5154e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199788.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0197e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140166.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(694696.1875, grad_fn=<MseLossBackward>)
output :  tensor([[155164.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5584e+10, grad_fn=<MseLossBackward>)
output :  tensor([[156027.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4527054., grad_fn=<MseLossBackward>)
output :  tensor([[130640.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1300882.8750, grad_fn=<MseLossBackward>)
output :  tensor([[245805.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7608e+10, grad_fn=<MseLossBackward>)
output :  tensor([[399130.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(8234747.5000, grad_fn=<MseLossBackward>)
output :  tensor([[112682.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(13559483., grad_fn=<MseLossBackward>)
output :  tensor([[123886.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(29014046., grad_fn=<MseLossBackward>)
output :  tensor([[161274.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3149515.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128870.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3150e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161622.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6455e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172889.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9551e+09, grad_fn=<MseLossBackward>)
output :  tensor([[101819.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3170347.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140088.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(829977.9375, grad_fn=<MseLossBackward>)
output :  tensor([[365849.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2085316.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202361.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6665e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179453.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(15628927., grad_fn=<MseLossBackward>)
output :  tensor([[194388.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(72445632., grad_fn=<MseLossBackward>)
output :  tensor([[138545.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(206300.4844, grad_fn=<MseLossBackward>)
output :  tensor([[192834.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2772745.2500, grad_fn=<MseLossBackward>)
output :  tensor([[135145.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6426e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174775.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(38749456., grad_fn=<MseLossBackward>)
output :  tensor([[242393.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(154633.2812, grad_fn=<MseLossBackward>)
output :  tensor([[172319.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2822715., grad_fn=<MseLossBackward>)
output :  tensor([[108688.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(474215.1562, grad_fn=<MseLossBackward>)
output :  tensor([[265469.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(825031.6250, grad_fn=<MseLossBackward>)
output :  tensor([[249836.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(26885.7500, grad_fn=<MseLossBackward>)
output :  tensor([[118725.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(18274022., grad_fn=<MseLossBackward>)
output :  tensor([[214816.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6220e+09, grad_fn=<MseLossBackward>)
output :  tensor([[302129.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3688e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202857.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(17157846., grad_fn=<MseLossBackward>)
output :  tensor([[212729.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6198e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158800.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(810534.4375, grad_fn=<MseLossBackward>)
output :  tensor([[173864.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(15010661., grad_fn=<MseLossBackward>)
output :  tensor([[159177.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5044095., grad_fn=<MseLossBackward>)
output :  tensor([[169310.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(475022.5000, grad_fn=<MseLossBackward>)
output :  tensor([[235260.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0719e+09, grad_fn=<MseLossBackward>)
output :  tensor([[215219.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0266e+08, grad_fn=<MseLossBackward>)
output :  tensor([[159649.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6001e+08, grad_fn=<MseLossBackward>)
output :  tensor([[121963.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1075174.6250, grad_fn=<MseLossBackward>)
output :  tensor([[177192.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(37140.5156, grad_fn=<MseLossBackward>)
output :  tensor([[179481.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4832e+09, grad_fn=<MseLossBackward>)
output :  tensor([[207530.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5001e+10, grad_fn=<MseLossBackward>)
output :  tensor([[137165.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7470314., grad_fn=<MseLossBackward>)
output :  tensor([[148241.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0979e+08, grad_fn=<MseLossBackward>)
output :  tensor([[277802.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(643605.0625, grad_fn=<MseLossBackward>)
output :  tensor([[86584.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2509996.5000, grad_fn=<MseLossBackward>)
output :  tensor([[235678.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(674810.9375, grad_fn=<MseLossBackward>)
output :  tensor([[254687.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0775e+11, grad_fn=<MseLossBackward>)
output :  tensor([[171086.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1181331.2500, grad_fn=<MseLossBackward>)
output :  tensor([[191503.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8919e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153597.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1967093.8750, grad_fn=<MseLossBackward>)
output :  tensor([[205588.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1489e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130245.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(1551211.8750, grad_fn=<MseLossBackward>)
output :  tensor([[143086.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3661661.7500, grad_fn=<MseLossBackward>)
output :  tensor([[170243.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6969e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186776.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(858344.3750, grad_fn=<MseLossBackward>)
output :  tensor([[129776.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(14262365., grad_fn=<MseLossBackward>)
output :  tensor([[136314.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(34282.8359, grad_fn=<MseLossBackward>)
output :  tensor([[176329.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(11082449., grad_fn=<MseLossBackward>)
output :  tensor([[198450.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6573e+09, grad_fn=<MseLossBackward>)
output :  tensor([[240681.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5375514.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153352.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2712763.5000, grad_fn=<MseLossBackward>)
output :  tensor([[192681.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(11013168., grad_fn=<MseLossBackward>)
output :  tensor([[161121.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9314e+08, grad_fn=<MseLossBackward>)
output :  tensor([[189788.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0585e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178590.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1714299.2500, grad_fn=<MseLossBackward>)
output :  tensor([[101923.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(24238622., grad_fn=<MseLossBackward>)
output :  tensor([[170942.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1894e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132683.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5364435., grad_fn=<MseLossBackward>)
output :  tensor([[120674.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(32201546., grad_fn=<MseLossBackward>)
output :  tensor([[170026.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(15791186., grad_fn=<MseLossBackward>)
output :  tensor([[88059.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(9361831., grad_fn=<MseLossBackward>)
output :  tensor([[286057.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(15540103., grad_fn=<MseLossBackward>)
output :  tensor([[170325.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(28361782., grad_fn=<MseLossBackward>)
output :  tensor([[190585.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0330e+10, grad_fn=<MseLossBackward>)
output :  tensor([[245091.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7126e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151251.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(63142.2656, grad_fn=<MseLossBackward>)
output :  tensor([[122343.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(2742465.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124691.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(22960794., grad_fn=<MseLossBackward>)
output :  tensor([[147534.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0585e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174499.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(249156.9688, grad_fn=<MseLossBackward>)
output :  tensor([[110045.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5873e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208428.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2006e+10, grad_fn=<MseLossBackward>)
output :  tensor([[241631.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(17185.5703, grad_fn=<MseLossBackward>)
output :  tensor([[252416.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0385e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221540.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0484e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196304.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4207e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188936.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2063846.5000, grad_fn=<MseLossBackward>)
output :  tensor([[206870.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7524e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190628.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1133e+10, grad_fn=<MseLossBackward>)
output :  tensor([[182612.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(14998435., grad_fn=<MseLossBackward>)
output :  tensor([[151233.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(587210.8750, grad_fn=<MseLossBackward>)
output :  tensor([[333549.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(11905088., grad_fn=<MseLossBackward>)
output :  tensor([[210014.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3944009.7500, grad_fn=<MseLossBackward>)
output :  tensor([[158400.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2556851., grad_fn=<MseLossBackward>)
output :  tensor([[184583.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2395e+09, grad_fn=<MseLossBackward>)
output :  tensor([[104327.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(452214.2188, grad_fn=<MseLossBackward>)
output :  tensor([[270478.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0953e+10, grad_fn=<MseLossBackward>)
output :  tensor([[169829.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(16565536., grad_fn=<MseLossBackward>)
output :  tensor([[207742.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(33150066., grad_fn=<MseLossBackward>)
output :  tensor([[208069.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6719e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176675.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6372232.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202211.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(169641.0156, grad_fn=<MseLossBackward>)
output :  tensor([[157225.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4950972.5000, grad_fn=<MseLossBackward>)
output :  tensor([[149420.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4424e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117368.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(1281300.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139538.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(213039.9375, grad_fn=<MseLossBackward>)
output :  tensor([[145566.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(11787635., grad_fn=<MseLossBackward>)
output :  tensor([[200745.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6194e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160978.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2187348.5000, grad_fn=<MseLossBackward>)
output :  tensor([[100377.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(769444.1875, grad_fn=<MseLossBackward>)
output :  tensor([[226643.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7839e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185580.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0321e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174917.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2458036., grad_fn=<MseLossBackward>)
output :  tensor([[84785.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(7760882., grad_fn=<MseLossBackward>)
output :  tensor([[129175.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(456891.5000, grad_fn=<MseLossBackward>)
output :  tensor([[214514.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(264276.3125, grad_fn=<MseLossBackward>)
output :  tensor([[143442.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(310336.0312, grad_fn=<MseLossBackward>)
output :  tensor([[131305.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1704493.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141843.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(572410.4375, grad_fn=<MseLossBackward>)
output :  tensor([[175831.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4693e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144960.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(923280.7500, grad_fn=<MseLossBackward>)
output :  tensor([[158908.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1191952.1250, grad_fn=<MseLossBackward>)
output :  tensor([[214754.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(60185.8906, grad_fn=<MseLossBackward>)
output :  tensor([[135432.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2614e+08, grad_fn=<MseLossBackward>)
output :  tensor([[256913.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3659927.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161123.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2635600., grad_fn=<MseLossBackward>)
output :  tensor([[133016.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(20396514., grad_fn=<MseLossBackward>)
output :  tensor([[97521.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(6357213.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153758.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7967e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176904.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8974612., grad_fn=<MseLossBackward>)
output :  tensor([[118841.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(2749870.7500, grad_fn=<MseLossBackward>)
output :  tensor([[187240.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7397e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145154.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3105e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150347.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(200368.1406, grad_fn=<MseLossBackward>)
output :  tensor([[188338.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(346571.3750, grad_fn=<MseLossBackward>)
output :  tensor([[252688.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6313e+09, grad_fn=<MseLossBackward>)
output :  tensor([[90400.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(1209192.3750, grad_fn=<MseLossBackward>)
output :  tensor([[237021.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(8869601., grad_fn=<MseLossBackward>)
output :  tensor([[128029.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(221804.2031, grad_fn=<MseLossBackward>)
output :  tensor([[164877.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0206e+10, grad_fn=<MseLossBackward>)
output :  tensor([[115111.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2835e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180642.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(21552226., grad_fn=<MseLossBackward>)
output :  tensor([[165122.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6166e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156819.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9271e+08, grad_fn=<MseLossBackward>)
output :  tensor([[234285.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(22224596., grad_fn=<MseLossBackward>)
output :  tensor([[224684.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1100e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127420.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(177155.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124519.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(2193199., grad_fn=<MseLossBackward>)
output :  tensor([[226328.]], grad_fn=<AddmmBackward>)
loss:  tensor(451584., grad_fn=<MseLossBackward>)
output :  tensor([[228300.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(32482342., grad_fn=<MseLossBackward>)
output :  tensor([[227852.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1327464., grad_fn=<MseLossBackward>)
output :  tensor([[145458.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6459857.5000, grad_fn=<MseLossBackward>)
output :  tensor([[210829.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(687474.1875, grad_fn=<MseLossBackward>)
output :  tensor([[129272.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(85974328., grad_fn=<MseLossBackward>)
output :  tensor([[135751.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(10574183., grad_fn=<MseLossBackward>)
output :  tensor([[310973.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(16214967., grad_fn=<MseLossBackward>)
output :  tensor([[139717.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1644165., grad_fn=<MseLossBackward>)
output :  tensor([[119750.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7827e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108547.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(907881.4375, grad_fn=<MseLossBackward>)
output :  tensor([[154055.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4020e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179097.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1447e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175081.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4333943.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194258.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(45453512., grad_fn=<MseLossBackward>)
output :  tensor([[99086.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(834139.7500, grad_fn=<MseLossBackward>)
output :  tensor([[180630.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2659957.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170674.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(7697763.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139363.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(132314.0625, grad_fn=<MseLossBackward>)
output :  tensor([[258821.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0056e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142987.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3626e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174299.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1688781.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143666.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(13445858., grad_fn=<MseLossBackward>)
output :  tensor([[203031.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6408729.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170899.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(809353.2500, grad_fn=<MseLossBackward>)
output :  tensor([[242252.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3052063.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133494.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1011533.0625, grad_fn=<MseLossBackward>)
output :  tensor([[150551.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1444616.2500, grad_fn=<MseLossBackward>)
output :  tensor([[213280.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2955229.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163821.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1388494., grad_fn=<MseLossBackward>)
output :  tensor([[188952.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2219.2932, grad_fn=<MseLossBackward>)
output :  tensor([[135043.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7393e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131184.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4773883.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138745.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1574593.6250, grad_fn=<MseLossBackward>)
output :  tensor([[199912.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8424e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164959.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4959e+09, grad_fn=<MseLossBackward>)
output :  tensor([[76318.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6630e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92510.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(64169360., grad_fn=<MseLossBackward>)
output :  tensor([[252351.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(886657.6250, grad_fn=<MseLossBackward>)
output :  tensor([[202942.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0886e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116111.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(1236179.1250, grad_fn=<MseLossBackward>)
output :  tensor([[158949.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1511e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206585.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7996e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178321.]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4050e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154771.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(52376.6133, grad_fn=<MseLossBackward>)
output :  tensor([[169724.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(75874.4219, grad_fn=<MseLossBackward>)
output :  tensor([[115145.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(21256.7285, grad_fn=<MseLossBackward>)
output :  tensor([[162807.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(60952664., grad_fn=<MseLossBackward>)
output :  tensor([[191621.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3344e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221174.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2802485.2500, grad_fn=<MseLossBackward>)
output :  tensor([[245508.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4949e+11, grad_fn=<MseLossBackward>)
output :  tensor([[150704.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(13725173., grad_fn=<MseLossBackward>)
output :  tensor([[110456.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(3905039.2500, grad_fn=<MseLossBackward>)
output :  tensor([[169953.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4273e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148209.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5246462., grad_fn=<MseLossBackward>)
output :  tensor([[234622.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5653249., grad_fn=<MseLossBackward>)
output :  tensor([[113892.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1227525.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175859.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(49567320., grad_fn=<MseLossBackward>)
output :  tensor([[187698.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(996939.8750, grad_fn=<MseLossBackward>)
output :  tensor([[163803.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4397e+10, grad_fn=<MseLossBackward>)
output :  tensor([[96126.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2880e+08, grad_fn=<MseLossBackward>)
output :  tensor([[233632.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(28811566., grad_fn=<MseLossBackward>)
output :  tensor([[177187.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1409970.7500, grad_fn=<MseLossBackward>)
output :  tensor([[140380.]], grad_fn=<AddmmBackward>)
loss:  tensor(144400., grad_fn=<MseLossBackward>)
output :  tensor([[238262.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(10641969., grad_fn=<MseLossBackward>)
output :  tensor([[160097.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8425595., grad_fn=<MseLossBackward>)
output :  tensor([[203908.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4663e+10, grad_fn=<MseLossBackward>)
output :  tensor([[138084.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(9517129., grad_fn=<MseLossBackward>)
output :  tensor([[185928.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7258e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134941.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1121117., grad_fn=<MseLossBackward>)
output :  tensor([[226202.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(95986720., grad_fn=<MseLossBackward>)
output :  tensor([[226042.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7394e+08, grad_fn=<MseLossBackward>)
output :  tensor([[89667.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(110597.8125, grad_fn=<MseLossBackward>)
output :  tensor([[158278.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1335071.8750, grad_fn=<MseLossBackward>)
output :  tensor([[246243.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5534e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146213.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1472771.8750, grad_fn=<MseLossBackward>)
output :  tensor([[109931.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8431e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162353.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4609542., grad_fn=<MseLossBackward>)
output :  tensor([[143238.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(579144.8125, grad_fn=<MseLossBackward>)
output :  tensor([[127677.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(272957.2812, grad_fn=<MseLossBackward>)
output :  tensor([[189580.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8191e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120444.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4224438., grad_fn=<MseLossBackward>)
output :  tensor([[154659.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7074852., grad_fn=<MseLossBackward>)
output :  tensor([[171905.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(24097.7109, grad_fn=<MseLossBackward>)
output :  tensor([[149858.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1303057.8750, grad_fn=<MseLossBackward>)
output :  tensor([[163651.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(564963.6250, grad_fn=<MseLossBackward>)
output :  tensor([[136145.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3688e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132124.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(15461.3682, grad_fn=<MseLossBackward>)
output :  tensor([[155577.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7482e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145001.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(721676.8125, grad_fn=<MseLossBackward>)
output :  tensor([[159144.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(6790584.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137991.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8915e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151173.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5632315.5000, grad_fn=<MseLossBackward>)
output :  tensor([[185664.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5454998., grad_fn=<MseLossBackward>)
output :  tensor([[171753.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7584344., grad_fn=<MseLossBackward>)
output :  tensor([[181073.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1151664.3750, grad_fn=<MseLossBackward>)
output :  tensor([[220265.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(70415.6016, grad_fn=<MseLossBackward>)
output :  tensor([[108902.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(1005491.8750, grad_fn=<MseLossBackward>)
output :  tensor([[136903.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4409e+08, grad_fn=<MseLossBackward>)
output :  tensor([[290182.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(17495658., grad_fn=<MseLossBackward>)
output :  tensor([[116885.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(783543.0625, grad_fn=<MseLossBackward>)
output :  tensor([[174771.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0456e+09, grad_fn=<MseLossBackward>)
output :  tensor([[187146.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4608938., grad_fn=<MseLossBackward>)
output :  tensor([[191323.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(33916976., grad_fn=<MseLossBackward>)
output :  tensor([[249376.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5656e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220882.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1248142.8750, grad_fn=<MseLossBackward>)
output :  tensor([[125890.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9962e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176223.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3932e+08, grad_fn=<MseLossBackward>)
output :  tensor([[121155.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8090913.5000, grad_fn=<MseLossBackward>)
output :  tensor([[181380.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6255e+10, grad_fn=<MseLossBackward>)
output :  tensor([[154691.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2862123.7500, grad_fn=<MseLossBackward>)
output :  tensor([[154895.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(70485472., grad_fn=<MseLossBackward>)
output :  tensor([[203237.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(9379385., grad_fn=<MseLossBackward>)
output :  tensor([[145276.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6323e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175096.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(816255.8125, grad_fn=<MseLossBackward>)
output :  tensor([[247955.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9504e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147644.]], grad_fn=<AddmmBackward>)
loss:  tensor(126736., grad_fn=<MseLossBackward>)
output :  tensor([[202670.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(30.9414, grad_fn=<MseLossBackward>)
output :  tensor([[157756.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4810757., grad_fn=<MseLossBackward>)
output :  tensor([[124029.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2981e+09, grad_fn=<MseLossBackward>)
output :  tensor([[132179.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(12747131., grad_fn=<MseLossBackward>)
output :  tensor([[183388.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(374505.7500, grad_fn=<MseLossBackward>)
output :  tensor([[198805.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(77544536., grad_fn=<MseLossBackward>)
output :  tensor([[228878.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6146e+09, grad_fn=<MseLossBackward>)
output :  tensor([[250534.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(41806932., grad_fn=<MseLossBackward>)
output :  tensor([[186275.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7616e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143122.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6649e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145592.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1192498.1250, grad_fn=<MseLossBackward>)
output :  tensor([[71888.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0169e+09, grad_fn=<MseLossBackward>)
output :  tensor([[140889.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(34690076., grad_fn=<MseLossBackward>)
output :  tensor([[131936.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(9218719., grad_fn=<MseLossBackward>)
output :  tensor([[154776.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(602612.5625, grad_fn=<MseLossBackward>)
output :  tensor([[132149.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(26514454., grad_fn=<MseLossBackward>)
output :  tensor([[77403.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(815931.1250, grad_fn=<MseLossBackward>)
output :  tensor([[83019.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1039953.8125, grad_fn=<MseLossBackward>)
output :  tensor([[220532.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3150e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141504.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4126e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134265.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(14179108., grad_fn=<MseLossBackward>)
output :  tensor([[166552.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(200690., grad_fn=<MseLossBackward>)
output :  tensor([[236573.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2476443.2500, grad_fn=<MseLossBackward>)
output :  tensor([[190043.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4394133., grad_fn=<MseLossBackward>)
output :  tensor([[153559.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5955582.5000, grad_fn=<MseLossBackward>)
output :  tensor([[197032.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(753152.7500, grad_fn=<MseLossBackward>)
output :  tensor([[201484.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2613e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137557.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(311346.5625, grad_fn=<MseLossBackward>)
output :  tensor([[155452.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(204968.4219, grad_fn=<MseLossBackward>)
output :  tensor([[136870.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(758096.7500, grad_fn=<MseLossBackward>)
output :  tensor([[196954.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0920e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154688.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(474634.8750, grad_fn=<MseLossBackward>)
output :  tensor([[137373.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9249e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146841.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3769665., grad_fn=<MseLossBackward>)
output :  tensor([[205012.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(48831924., grad_fn=<MseLossBackward>)
output :  tensor([[103707.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7122e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167200.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(89541.2109, grad_fn=<MseLossBackward>)
output :  tensor([[126888.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1236266., grad_fn=<MseLossBackward>)
output :  tensor([[147293.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(86068.8906, grad_fn=<MseLossBackward>)
output :  tensor([[105992.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9017e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137807.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(94825.5000, grad_fn=<MseLossBackward>)
output :  tensor([[228110.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(62249388., grad_fn=<MseLossBackward>)
output :  tensor([[145018.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(333.0625, grad_fn=<MseLossBackward>)
output :  tensor([[137399.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(10197.8438, grad_fn=<MseLossBackward>)
output :  tensor([[163986.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2950e+09, grad_fn=<MseLossBackward>)
output :  tensor([[267584.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0848e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172887.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4462326., grad_fn=<MseLossBackward>)
output :  tensor([[105382.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(6792905.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202131.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6803e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163990.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(24900880., grad_fn=<MseLossBackward>)
output :  tensor([[161948.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6431e+10, grad_fn=<MseLossBackward>)
output :  tensor([[99016.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(513506.5938, grad_fn=<MseLossBackward>)
output :  tensor([[123956.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(127209.2500, grad_fn=<MseLossBackward>)
output :  tensor([[154499.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2250609.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140261.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(68276.0547, grad_fn=<MseLossBackward>)
output :  tensor([[199351.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(420673.8438, grad_fn=<MseLossBackward>)
output :  tensor([[140988.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1022373.7500, grad_fn=<MseLossBackward>)
output :  tensor([[266182.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(15229506., grad_fn=<MseLossBackward>)
output :  tensor([[128635.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2699e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163872.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2647942.5000, grad_fn=<MseLossBackward>)
output :  tensor([[187425.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1155054., grad_fn=<MseLossBackward>)
output :  tensor([[125401.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3721e+08, grad_fn=<MseLossBackward>)
output :  tensor([[249191.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(653167.0625, grad_fn=<MseLossBackward>)
output :  tensor([[157633.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6238e+08, grad_fn=<MseLossBackward>)
output :  tensor([[242067.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(10775832., grad_fn=<MseLossBackward>)
output :  tensor([[143897.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(10442.2852, grad_fn=<MseLossBackward>)
output :  tensor([[208155.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3401142.7500, grad_fn=<MseLossBackward>)
output :  tensor([[172538.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(19264.5723, grad_fn=<MseLossBackward>)
output :  tensor([[153070.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(864406., grad_fn=<MseLossBackward>)
output :  tensor([[121153.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(9947568., grad_fn=<MseLossBackward>)
output :  tensor([[239223.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2912e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237577.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5869566., grad_fn=<MseLossBackward>)
output :  tensor([[151478.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3453557.7500, grad_fn=<MseLossBackward>)
output :  tensor([[254579.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(102670.1797, grad_fn=<MseLossBackward>)
output :  tensor([[121722.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(52110576., grad_fn=<MseLossBackward>)
output :  tensor([[177387.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1924072.3750, grad_fn=<MseLossBackward>)
output :  tensor([[160719.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(517860.1250, grad_fn=<MseLossBackward>)
output :  tensor([[132348.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1818073., grad_fn=<MseLossBackward>)
output :  tensor([[195363.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3380e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167307.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(10940280., grad_fn=<MseLossBackward>)
output :  tensor([[164928.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3719473.7500, grad_fn=<MseLossBackward>)
output :  tensor([[156989.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1021236.5625, grad_fn=<MseLossBackward>)
output :  tensor([[151164.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1598367.6250, grad_fn=<MseLossBackward>)
output :  tensor([[176746.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5221e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161763.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3109987.2500, grad_fn=<MseLossBackward>)
output :  tensor([[377439.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(42652736., grad_fn=<MseLossBackward>)
output :  tensor([[136972.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(99452936., grad_fn=<MseLossBackward>)
output :  tensor([[131123.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0815e+09, grad_fn=<MseLossBackward>)
output :  tensor([[283494.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5206953.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163435.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2060391.1250, grad_fn=<MseLossBackward>)
output :  tensor([[133588.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7130e+08, grad_fn=<MseLossBackward>)
output :  tensor([[240403.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(70614344., grad_fn=<MseLossBackward>)
output :  tensor([[180684.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(34190.3203, grad_fn=<MseLossBackward>)
output :  tensor([[156362.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(19032496., grad_fn=<MseLossBackward>)
output :  tensor([[143428.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2468826.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159184.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9659e+08, grad_fn=<MseLossBackward>)
output :  tensor([[101243.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(1547438.8750, grad_fn=<MseLossBackward>)
output :  tensor([[76335.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6686e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162767.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4983707.5000, grad_fn=<MseLossBackward>)
output :  tensor([[188011.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5991e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157311.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(474161.3438, grad_fn=<MseLossBackward>)
output :  tensor([[159411.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3654310.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138474.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1049120.1250, grad_fn=<MseLossBackward>)
output :  tensor([[208508.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6543763.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139617.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2617620.7500, grad_fn=<MseLossBackward>)
output :  tensor([[182423.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6276e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144420.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2493389., grad_fn=<MseLossBackward>)
output :  tensor([[108430.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4671e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96111.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4456980.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176500.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2252766.5000, grad_fn=<MseLossBackward>)
output :  tensor([[263730.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(11092855., grad_fn=<MseLossBackward>)
output :  tensor([[141671.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(29380.1016, grad_fn=<MseLossBackward>)
output :  tensor([[159291.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(364344.2812, grad_fn=<MseLossBackward>)
output :  tensor([[133786.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1654318.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147706.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3216250., grad_fn=<MseLossBackward>)
output :  tensor([[165616.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5212660., grad_fn=<MseLossBackward>)
output :  tensor([[125151.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3416028., grad_fn=<MseLossBackward>)
output :  tensor([[173794.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2912e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157361.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(130682.2500, grad_fn=<MseLossBackward>)
output :  tensor([[120331.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(14680033., grad_fn=<MseLossBackward>)
output :  tensor([[161601.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0978e+09, grad_fn=<MseLossBackward>)
output :  tensor([[53666.3711]], grad_fn=<AddmmBackward>)
loss:  tensor(2776792.5000, grad_fn=<MseLossBackward>)
output :  tensor([[232779.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3554e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199996.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1006730.0625, grad_fn=<MseLossBackward>)
output :  tensor([[186879.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3531404.5000, grad_fn=<MseLossBackward>)
output :  tensor([[107440.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(2074882.7500, grad_fn=<MseLossBackward>)
output :  tensor([[89079.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4325815., grad_fn=<MseLossBackward>)
output :  tensor([[138623.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1893419., grad_fn=<MseLossBackward>)
output :  tensor([[221046.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3222e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201728.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(33312016., grad_fn=<MseLossBackward>)
output :  tensor([[167155.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4646719., grad_fn=<MseLossBackward>)
output :  tensor([[173904.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2983e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190118.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(14079.3057, grad_fn=<MseLossBackward>)
output :  tensor([[85881.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(1249976.3750, grad_fn=<MseLossBackward>)
output :  tensor([[138788.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1466823.7500, grad_fn=<MseLossBackward>)
output :  tensor([[110665.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(27390.2500, grad_fn=<MseLossBackward>)
output :  tensor([[148051.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4621e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171568.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6458e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195862.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(83496192., grad_fn=<MseLossBackward>)
output :  tensor([[180367.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(135355.0156, grad_fn=<MseLossBackward>)
output :  tensor([[97189.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(475949.0625, grad_fn=<MseLossBackward>)
output :  tensor([[117825.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(105818.0547, grad_fn=<MseLossBackward>)
output :  tensor([[161654.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9934e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199478.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(272027.4375, grad_fn=<MseLossBackward>)
output :  tensor([[144352.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(124465.6328, grad_fn=<MseLossBackward>)
train_loss: [2.6247043e+09]
epoch_result tensor([0.])
output :  tensor([[158632.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(17684.8438, grad_fn=<MseLossBackward>)
output :  tensor([[121033.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(934288.3750, grad_fn=<MseLossBackward>)
output :  tensor([[190704.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(12222999., grad_fn=<MseLossBackward>)
output :  tensor([[177530.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(281015.9375, grad_fn=<MseLossBackward>)
output :  tensor([[154665.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4450e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125380.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(6862230.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140899.]], grad_fn=<AddmmBackward>)
loss:  tensor(10201., grad_fn=<MseLossBackward>)
output :  tensor([[117678.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(1746548.1250, grad_fn=<MseLossBackward>)
output :  tensor([[66441.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(63073380., grad_fn=<MseLossBackward>)
output :  tensor([[165584.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(172549.3750, grad_fn=<MseLossBackward>)
output :  tensor([[145503.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(30288856., grad_fn=<MseLossBackward>)
output :  tensor([[224497.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(252993.2812, grad_fn=<MseLossBackward>)
output :  tensor([[168121.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(772311.4375, grad_fn=<MseLossBackward>)
output :  tensor([[247663.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4147332.2500, grad_fn=<MseLossBackward>)
output :  tensor([[55490.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(240176.5625, grad_fn=<MseLossBackward>)
output :  tensor([[164090.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8378e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174631.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(135780.7344, grad_fn=<MseLossBackward>)
output :  tensor([[163527.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(49389928., grad_fn=<MseLossBackward>)
output :  tensor([[276418.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2012674.2500, grad_fn=<MseLossBackward>)
output :  tensor([[194299.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(7293206.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137420.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5669e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193246.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(399621.5312, grad_fn=<MseLossBackward>)
output :  tensor([[176589.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3339e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152208.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1459301.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169933.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4445.1387, grad_fn=<MseLossBackward>)
output :  tensor([[87402.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4011508.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170073.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2574e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182524.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6129570., grad_fn=<MseLossBackward>)
output :  tensor([[205304.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5196e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111559.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(2430505.2500, grad_fn=<MseLossBackward>)
output :  tensor([[169708.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1667488., grad_fn=<MseLossBackward>)
output :  tensor([[138080.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2497832., grad_fn=<MseLossBackward>)
output :  tensor([[129709.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(503046.6562, grad_fn=<MseLossBackward>)
output :  tensor([[121205.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(2907478., grad_fn=<MseLossBackward>)
output :  tensor([[147550.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3334e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168394.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1493e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151650.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3804328.2500, grad_fn=<MseLossBackward>)
output :  tensor([[183594.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(12919981., grad_fn=<MseLossBackward>)
output :  tensor([[143762.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7631233.5000, grad_fn=<MseLossBackward>)
output :  tensor([[104542.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1148e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137345.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0302e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133836.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1354532.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138737.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3778e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222347.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7034181.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133000.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(562593.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147918.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1169777.5000, grad_fn=<MseLossBackward>)
output :  tensor([[115001.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(9007877., grad_fn=<MseLossBackward>)
output :  tensor([[160072.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(5272.1211, grad_fn=<MseLossBackward>)
output :  tensor([[142995.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7045e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196047.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(16384407., grad_fn=<MseLossBackward>)
output :  tensor([[136885.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5933487., grad_fn=<MseLossBackward>)
output :  tensor([[124696.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1600e+08, grad_fn=<MseLossBackward>)
output :  tensor([[231915.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4343707.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165827.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2717e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151202.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(60796620., grad_fn=<MseLossBackward>)
output :  tensor([[204110.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8355e+10, grad_fn=<MseLossBackward>)
output :  tensor([[245696.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1730e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143354.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(21034.0625, grad_fn=<MseLossBackward>)
output :  tensor([[137262.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(10645130., grad_fn=<MseLossBackward>)
output :  tensor([[157764.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7644620., grad_fn=<MseLossBackward>)
output :  tensor([[135471.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(29937142., grad_fn=<MseLossBackward>)
output :  tensor([[183771.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8107e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184503.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(162812.2500, grad_fn=<MseLossBackward>)
output :  tensor([[162260.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(578550.3750, grad_fn=<MseLossBackward>)
output :  tensor([[150165.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(51349540., grad_fn=<MseLossBackward>)
output :  tensor([[145222.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7412942., grad_fn=<MseLossBackward>)
output :  tensor([[141319.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(13543205., grad_fn=<MseLossBackward>)
output :  tensor([[173004.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4464e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192485.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0094e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138368.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3490183., grad_fn=<MseLossBackward>)
output :  tensor([[172195.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(87061.8750, grad_fn=<MseLossBackward>)
output :  tensor([[180322.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(458667.5625, grad_fn=<MseLossBackward>)
output :  tensor([[112262.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(7496601., grad_fn=<MseLossBackward>)
output :  tensor([[218387.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(6824340., grad_fn=<MseLossBackward>)
output :  tensor([[183735.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(55364.6211, grad_fn=<MseLossBackward>)
output :  tensor([[128310.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(7896495., grad_fn=<MseLossBackward>)
output :  tensor([[197940.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2074410.1250, grad_fn=<MseLossBackward>)
output :  tensor([[174980.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6422.5195, grad_fn=<MseLossBackward>)
output :  tensor([[208831.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1477e+10, grad_fn=<MseLossBackward>)
output :  tensor([[205534.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(29868274., grad_fn=<MseLossBackward>)
output :  tensor([[168057.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3733e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194620.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(14610.7656, grad_fn=<MseLossBackward>)
output :  tensor([[114203.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(1447641.3750, grad_fn=<MseLossBackward>)
output :  tensor([[115660.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(9987229., grad_fn=<MseLossBackward>)
output :  tensor([[112665.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(442651.1250, grad_fn=<MseLossBackward>)
output :  tensor([[148602.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3248443., grad_fn=<MseLossBackward>)
output :  tensor([[160999.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2994e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180901.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(812195.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128496.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(993370.3750, grad_fn=<MseLossBackward>)
output :  tensor([[146601.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2564201.7500, grad_fn=<MseLossBackward>)
output :  tensor([[180729.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1004e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117977.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1160871.6250, grad_fn=<MseLossBackward>)
output :  tensor([[199328.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5422058., grad_fn=<MseLossBackward>)
output :  tensor([[144547.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(204515.9375, grad_fn=<MseLossBackward>)
output :  tensor([[212565.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(111900.7031, grad_fn=<MseLossBackward>)
output :  tensor([[125738.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(68202.5859, grad_fn=<MseLossBackward>)
output :  tensor([[248229.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(9754.6484, grad_fn=<MseLossBackward>)
output :  tensor([[236538.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3485e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147896.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7213e+08, grad_fn=<MseLossBackward>)
output :  tensor([[86163.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3322e+08, grad_fn=<MseLossBackward>)
output :  tensor([[191444.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9648e+09, grad_fn=<MseLossBackward>)
output :  tensor([[79792.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(1457471.3750, grad_fn=<MseLossBackward>)
output :  tensor([[137781.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2954423.7500, grad_fn=<MseLossBackward>)
output :  tensor([[77755.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5085518.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141518.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2056535.2500, grad_fn=<MseLossBackward>)
output :  tensor([[175442.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(311154.7812, grad_fn=<MseLossBackward>)
output :  tensor([[152501.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(997376.7500, grad_fn=<MseLossBackward>)
output :  tensor([[112667.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(27744334., grad_fn=<MseLossBackward>)
output :  tensor([[205251.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2210e+10, grad_fn=<MseLossBackward>)
output :  tensor([[130239.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3025371., grad_fn=<MseLossBackward>)
output :  tensor([[266883.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7205e+08, grad_fn=<MseLossBackward>)
output :  tensor([[300866.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(83425392., grad_fn=<MseLossBackward>)
output :  tensor([[107076.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(179372.1094, grad_fn=<MseLossBackward>)
output :  tensor([[170216.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5216299., grad_fn=<MseLossBackward>)
output :  tensor([[133994.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7571e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134219.]], grad_fn=<AddmmBackward>)
loss:  tensor(22857960., grad_fn=<MseLossBackward>)
output :  tensor([[124879.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(28843612., grad_fn=<MseLossBackward>)
output :  tensor([[124505.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(244483.8906, grad_fn=<MseLossBackward>)
output :  tensor([[136365.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2173e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227077.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8386e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188181.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3353e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144431.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(282924.2500, grad_fn=<MseLossBackward>)
output :  tensor([[126334.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(1359282.7500, grad_fn=<MseLossBackward>)
output :  tensor([[112153.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(815931.1250, grad_fn=<MseLossBackward>)
output :  tensor([[254201.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0781e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133830.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1367328.2500, grad_fn=<MseLossBackward>)
output :  tensor([[200845.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4642880., grad_fn=<MseLossBackward>)
output :  tensor([[103930.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(940748.4375, grad_fn=<MseLossBackward>)
output :  tensor([[136666.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(10780244., grad_fn=<MseLossBackward>)
output :  tensor([[209117.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3663e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181319.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2013871.3750, grad_fn=<MseLossBackward>)
output :  tensor([[187192.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4808769.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162852.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1359e+10, grad_fn=<MseLossBackward>)
output :  tensor([[297013.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4430e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197013.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(785522.1250, grad_fn=<MseLossBackward>)
output :  tensor([[261873.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9878e+10, grad_fn=<MseLossBackward>)
output :  tensor([[220020.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1141e+09, grad_fn=<MseLossBackward>)
output :  tensor([[283426.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1272e+09, grad_fn=<MseLossBackward>)
output :  tensor([[222011.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3953573., grad_fn=<MseLossBackward>)
output :  tensor([[221249.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9156e+10, grad_fn=<MseLossBackward>)
output :  tensor([[197528.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(279081.0938, grad_fn=<MseLossBackward>)
output :  tensor([[158615.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7706e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131085.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2001650.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138541.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(9250437., grad_fn=<MseLossBackward>)
output :  tensor([[91282.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(79801.8359, grad_fn=<MseLossBackward>)
output :  tensor([[107033.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(934469.6250, grad_fn=<MseLossBackward>)
output :  tensor([[274124.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0004e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239744.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(22510726., grad_fn=<MseLossBackward>)
output :  tensor([[147099.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4407310., grad_fn=<MseLossBackward>)
output :  tensor([[139752.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(5073193., grad_fn=<MseLossBackward>)
output :  tensor([[174439.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(499186.4062, grad_fn=<MseLossBackward>)
output :  tensor([[152086.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(46737944., grad_fn=<MseLossBackward>)
output :  tensor([[162924.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9702e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165070.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4965.8447, grad_fn=<MseLossBackward>)
output :  tensor([[135115.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3552518.2500, grad_fn=<MseLossBackward>)
output :  tensor([[190106.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5706e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113528.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2337506.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165519.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(42002348., grad_fn=<MseLossBackward>)
output :  tensor([[125714.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(32652832., grad_fn=<MseLossBackward>)
output :  tensor([[85594.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1975847.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179181.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(669354.0625, grad_fn=<MseLossBackward>)
output :  tensor([[111800.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3612256.5000, grad_fn=<MseLossBackward>)
output :  tensor([[233048.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(35417376., grad_fn=<MseLossBackward>)
output :  tensor([[240754.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(18022810., grad_fn=<MseLossBackward>)
output :  tensor([[123669.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(33997828., grad_fn=<MseLossBackward>)
output :  tensor([[109159.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(40031.2578, grad_fn=<MseLossBackward>)
output :  tensor([[285546.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2985e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171188.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(96954.3906, grad_fn=<MseLossBackward>)
output :  tensor([[123108.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(3576383.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144474.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0089e+08, grad_fn=<MseLossBackward>)
output :  tensor([[200626.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7885e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141842.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(710570., grad_fn=<MseLossBackward>)
output :  tensor([[159429.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4537e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151553.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5505035.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128603.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(804020.4375, grad_fn=<MseLossBackward>)
output :  tensor([[247161.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7250e+10, grad_fn=<MseLossBackward>)
output :  tensor([[400145.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3439402., grad_fn=<MseLossBackward>)
output :  tensor([[108505.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(244862.6094, grad_fn=<MseLossBackward>)
output :  tensor([[117887.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(374620.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159697.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(38839.7891, grad_fn=<MseLossBackward>)
output :  tensor([[132175.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7630e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164380.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3200e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173672.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0542e+09, grad_fn=<MseLossBackward>)
output :  tensor([[101893.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2913795.7500, grad_fn=<MseLossBackward>)
output :  tensor([[141236.]], grad_fn=<AddmmBackward>)
loss:  tensor(55696., grad_fn=<MseLossBackward>)
output :  tensor([[362880.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(19482016., grad_fn=<MseLossBackward>)
output :  tensor([[204121.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4879e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183163.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(58730908., grad_fn=<MseLossBackward>)
output :  tensor([[202231.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(446934.0312, grad_fn=<MseLossBackward>)
output :  tensor([[138967.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1041.0706, grad_fn=<MseLossBackward>)
output :  tensor([[200518.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(36218768., grad_fn=<MseLossBackward>)
output :  tensor([[135422.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7969e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183136.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4563631., grad_fn=<MseLossBackward>)
output :  tensor([[238768.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(10439866., grad_fn=<MseLossBackward>)
output :  tensor([[173196.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(645737.8125, grad_fn=<MseLossBackward>)
output :  tensor([[105718.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5203103.5000, grad_fn=<MseLossBackward>)
output :  tensor([[263770.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(625483.2500, grad_fn=<MseLossBackward>)
output :  tensor([[246846.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(9943872., grad_fn=<MseLossBackward>)
output :  tensor([[121235.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3115114.7500, grad_fn=<MseLossBackward>)
output :  tensor([[218157.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2311e+09, grad_fn=<MseLossBackward>)
output :  tensor([[304181.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4599e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209328.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(5421912., grad_fn=<MseLossBackward>)
output :  tensor([[217079.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5109e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159440.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2373573.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167729.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5108942., grad_fn=<MseLossBackward>)
output :  tensor([[163112.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(38200704., grad_fn=<MseLossBackward>)
output :  tensor([[170456.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(208249.6250, grad_fn=<MseLossBackward>)
output :  tensor([[236656.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8244e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223192.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(39233976., grad_fn=<MseLossBackward>)
output :  tensor([[160776.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8979e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124984.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(3938085.2500, grad_fn=<MseLossBackward>)
output :  tensor([[175897.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1216402.2500, grad_fn=<MseLossBackward>)
output :  tensor([[181879.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1029e+09, grad_fn=<MseLossBackward>)
output :  tensor([[207875.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4872e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134064.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(135079.2188, grad_fn=<MseLossBackward>)
output :  tensor([[151621.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0130e+08, grad_fn=<MseLossBackward>)
output :  tensor([[271769.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(27360746., grad_fn=<MseLossBackward>)
output :  tensor([[87286.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5227725., grad_fn=<MseLossBackward>)
output :  tensor([[236278.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(49235.4492, grad_fn=<MseLossBackward>)
output :  tensor([[261903.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0306e+11, grad_fn=<MseLossBackward>)
output :  tensor([[170659.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(434981.4688, grad_fn=<MseLossBackward>)
output :  tensor([[193795.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6978e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153627.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1883670.5000, grad_fn=<MseLossBackward>)
output :  tensor([[206218.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0680e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128584.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(172620.7812, grad_fn=<MseLossBackward>)
output :  tensor([[149470.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(19988724., grad_fn=<MseLossBackward>)
output :  tensor([[171168.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2187e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186523.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(453581.2188, grad_fn=<MseLossBackward>)
output :  tensor([[128168.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(4703307., grad_fn=<MseLossBackward>)
output :  tensor([[139307.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7883723.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172669.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(109240.5781, grad_fn=<MseLossBackward>)
output :  tensor([[198813.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6200e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239068.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(15457552., grad_fn=<MseLossBackward>)
output :  tensor([[155342.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(117102.9766, grad_fn=<MseLossBackward>)
output :  tensor([[199175.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(10081121., grad_fn=<MseLossBackward>)
output :  tensor([[163787.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9153e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187533.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(64535112., grad_fn=<MseLossBackward>)
output :  tensor([[179145.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(569836.2500, grad_fn=<MseLossBackward>)
output :  tensor([[103728.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(45269872., grad_fn=<MseLossBackward>)
output :  tensor([[171725.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1723e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133117.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3544218., grad_fn=<MseLossBackward>)
output :  tensor([[121511.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(42401768., grad_fn=<MseLossBackward>)
output :  tensor([[175149.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1321961., grad_fn=<MseLossBackward>)
output :  tensor([[86950.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(3805517., grad_fn=<MseLossBackward>)
output :  tensor([[289830.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(28677.3047, grad_fn=<MseLossBackward>)
output :  tensor([[167539.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6451044.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191079.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0189e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243594.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5109e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151467.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(218702.3750, grad_fn=<MseLossBackward>)
output :  tensor([[125488.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2216702.2500, grad_fn=<MseLossBackward>)
output :  tensor([[118415.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(2203763.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143610.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1855e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174385.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(148489.8125, grad_fn=<MseLossBackward>)
output :  tensor([[112030.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7207e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208222.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2051e+10, grad_fn=<MseLossBackward>)
output :  tensor([[231121.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0771e+08, grad_fn=<MseLossBackward>)
output :  tensor([[251361.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0687e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222450.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7388e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196312.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4206e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190094.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6732160., grad_fn=<MseLossBackward>)
output :  tensor([[207623.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7196e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188706.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1695e+10, grad_fn=<MseLossBackward>)
output :  tensor([[175600.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(9859109., grad_fn=<MseLossBackward>)
output :  tensor([[151224.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(600770.3125, grad_fn=<MseLossBackward>)
output :  tensor([[335233.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3120301.5000, grad_fn=<MseLossBackward>)
output :  tensor([[210867.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1281990., grad_fn=<MseLossBackward>)
output :  tensor([[161837.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3377899.5000, grad_fn=<MseLossBackward>)
output :  tensor([[184560.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2421e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109967.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(24672330., grad_fn=<MseLossBackward>)
output :  tensor([[275241.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8265e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174458.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(311922.2500, grad_fn=<MseLossBackward>)
output :  tensor([[215511.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4045063.7500, grad_fn=<MseLossBackward>)
output :  tensor([[208844.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4776e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179399.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(39831.4297, grad_fn=<MseLossBackward>)
output :  tensor([[201710.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8060.6729, grad_fn=<MseLossBackward>)
output :  tensor([[154204.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(633193.1875, grad_fn=<MseLossBackward>)
output :  tensor([[147858.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2905e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118892.]], grad_fn=<AddmmBackward>)
loss:  tensor(153664., grad_fn=<MseLossBackward>)
output :  tensor([[140861.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(742559.1875, grad_fn=<MseLossBackward>)
output :  tensor([[147194.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3259491.7500, grad_fn=<MseLossBackward>)
output :  tensor([[201479.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6007e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161569.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4282636., grad_fn=<MseLossBackward>)
output :  tensor([[100837.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1790160.3750, grad_fn=<MseLossBackward>)
output :  tensor([[224188.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5001e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185892.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1587e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176233.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(63173.6797, grad_fn=<MseLossBackward>)
output :  tensor([[84562.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6565525.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127671.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(685726.3125, grad_fn=<MseLossBackward>)
output :  tensor([[215872.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3505905.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143232.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(589008.3125, grad_fn=<MseLossBackward>)
output :  tensor([[136877.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(47305380., grad_fn=<MseLossBackward>)
output :  tensor([[142462.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(18966.4531, grad_fn=<MseLossBackward>)
output :  tensor([[179067.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7278e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142672.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1761260.7500, grad_fn=<MseLossBackward>)
output :  tensor([[159259.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(548247.6875, grad_fn=<MseLossBackward>)
output :  tensor([[216735.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3012556.7500, grad_fn=<MseLossBackward>)
output :  tensor([[136495.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9198e+08, grad_fn=<MseLossBackward>)
output :  tensor([[256096.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1202963.3750, grad_fn=<MseLossBackward>)
output :  tensor([[155392.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(16871684., grad_fn=<MseLossBackward>)
output :  tensor([[129735.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(1527483.6250, grad_fn=<MseLossBackward>)
output :  tensor([[94731.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(72352.5938, grad_fn=<MseLossBackward>)
output :  tensor([[153184.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7175e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178207.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2863445.7500, grad_fn=<MseLossBackward>)
output :  tensor([[121480.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(962223.0625, grad_fn=<MseLossBackward>)
output :  tensor([[189383.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5655e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146238.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4541e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149511.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(150847.2812, grad_fn=<MseLossBackward>)
output :  tensor([[188596.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(717117.8750, grad_fn=<MseLossBackward>)
output :  tensor([[254448.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4921e+09, grad_fn=<MseLossBackward>)
output :  tensor([[94645.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(9895055., grad_fn=<MseLossBackward>)
output :  tensor([[239598.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(161541.1875, grad_fn=<MseLossBackward>)
output :  tensor([[127655.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(712612.9375, grad_fn=<MseLossBackward>)
output :  tensor([[166314.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9172e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113523.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8289e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176461.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(213342.9531, grad_fn=<MseLossBackward>)
output :  tensor([[164252.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1766e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154344.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6856e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236326.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(7146265.5000, grad_fn=<MseLossBackward>)
output :  tensor([[225554.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0527e+09, grad_fn=<MseLossBackward>)
output :  tensor([[125157.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3393885., grad_fn=<MseLossBackward>)
output :  tensor([[127109.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(1230626.2500, grad_fn=<MseLossBackward>)
output :  tensor([[225337.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2764270., grad_fn=<MseLossBackward>)
output :  tensor([[230127.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(14994804., grad_fn=<MseLossBackward>)
output :  tensor([[225568.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1280292.2500, grad_fn=<MseLossBackward>)
output :  tensor([[147854.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(21043.1289, grad_fn=<MseLossBackward>)
output :  tensor([[203231.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(45809632., grad_fn=<MseLossBackward>)
output :  tensor([[130289.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0587e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135638.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(9848907., grad_fn=<MseLossBackward>)
output :  tensor([[308430.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(43162436., grad_fn=<MseLossBackward>)
output :  tensor([[141568.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(322908.0625, grad_fn=<MseLossBackward>)
output :  tensor([[123588.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2022e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108418.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1168797.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155819.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7824e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178968.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1694e+09, grad_fn=<MseLossBackward>)
output :  tensor([[170413.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6692245.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194701.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(39668740., grad_fn=<MseLossBackward>)
output :  tensor([[104991.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(24916398., grad_fn=<MseLossBackward>)
output :  tensor([[174477.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(20452724., grad_fn=<MseLossBackward>)
output :  tensor([[164934.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(8794932., grad_fn=<MseLossBackward>)
output :  tensor([[139094.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(8888.9541, grad_fn=<MseLossBackward>)
output :  tensor([[261060.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6118e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142366.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2910e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173637.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(406027.8125, grad_fn=<MseLossBackward>)
output :  tensor([[139430.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(324739.7188, grad_fn=<MseLossBackward>)
output :  tensor([[202451.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3806827.7500, grad_fn=<MseLossBackward>)
output :  tensor([[168232.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3124719., grad_fn=<MseLossBackward>)
output :  tensor([[242628.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1880926.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137769.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(10691469., grad_fn=<MseLossBackward>)
output :  tensor([[150170.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(674015.3750, grad_fn=<MseLossBackward>)
output :  tensor([[212816.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4766717., grad_fn=<MseLossBackward>)
output :  tensor([[166378.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1900951.5000, grad_fn=<MseLossBackward>)
output :  tensor([[196432.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(55236248., grad_fn=<MseLossBackward>)
output :  tensor([[133187.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6630e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129234.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(54891.3633, grad_fn=<MseLossBackward>)
output :  tensor([[139999.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(0.0881, grad_fn=<MseLossBackward>)
output :  tensor([[202850.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4422e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166617.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6643e+09, grad_fn=<MseLossBackward>)
output :  tensor([[74800.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1905e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96753.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5015e+08, grad_fn=<MseLossBackward>)
output :  tensor([[252106.]], grad_fn=<AddmmBackward>)
loss:  tensor(1408969., grad_fn=<MseLossBackward>)
output :  tensor([[202787.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0688e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114001.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(997595.1875, grad_fn=<MseLossBackward>)
output :  tensor([[159504.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8373e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207247.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6262e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179835.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1297e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157541.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6458110.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170126.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(15883.8760, grad_fn=<MseLossBackward>)
output :  tensor([[117347.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5510242.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163589.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(73772528., grad_fn=<MseLossBackward>)
output :  tensor([[192329.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1231e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219830.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(109075.3828, grad_fn=<MseLossBackward>)
output :  tensor([[248616.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4640e+11, grad_fn=<MseLossBackward>)
output :  tensor([[152960.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(35532216., grad_fn=<MseLossBackward>)
output :  tensor([[111834.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(11255868., grad_fn=<MseLossBackward>)
output :  tensor([[168623.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7626e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151946.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2093628.1250, grad_fn=<MseLossBackward>)
output :  tensor([[235392.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2584307.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117009.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4036897.2500, grad_fn=<MseLossBackward>)
output :  tensor([[181476.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2025062.3750, grad_fn=<MseLossBackward>)
output :  tensor([[188625.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3706347., grad_fn=<MseLossBackward>)
output :  tensor([[163606.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4459e+10, grad_fn=<MseLossBackward>)
output :  tensor([[96344.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3546e+08, grad_fn=<MseLossBackward>)
output :  tensor([[246472.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(55845496., grad_fn=<MseLossBackward>)
output :  tensor([[178173.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4723219.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138747.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1569265.1250, grad_fn=<MseLossBackward>)
output :  tensor([[234052.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(898437.3750, grad_fn=<MseLossBackward>)
output :  tensor([[168460.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(29816036., grad_fn=<MseLossBackward>)
output :  tensor([[202577.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4987e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134203.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(633690.6250, grad_fn=<MseLossBackward>)
output :  tensor([[186346.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9274e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136284.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(80958.0312, grad_fn=<MseLossBackward>)
output :  tensor([[228177.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(61193952., grad_fn=<MseLossBackward>)
output :  tensor([[226753.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4042e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93239.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(10496942., grad_fn=<MseLossBackward>)
output :  tensor([[160085.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(424920.6562, grad_fn=<MseLossBackward>)
output :  tensor([[246912.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5367e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145055.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3035.3213, grad_fn=<MseLossBackward>)
output :  tensor([[110287.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8738e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165587.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1182350.3750, grad_fn=<MseLossBackward>)
output :  tensor([[146366.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5600100.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129659.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(2128703.7500, grad_fn=<MseLossBackward>)
output :  tensor([[189953.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7675e+09, grad_fn=<MseLossBackward>)
output :  tensor([[122943.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(196394.3906, grad_fn=<MseLossBackward>)
output :  tensor([[149978.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4086209.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167014.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(22426588., grad_fn=<MseLossBackward>)
output :  tensor([[152764.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3112798.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160957.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3774399., grad_fn=<MseLossBackward>)
output :  tensor([[134806.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6598e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129882.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(4483773., grad_fn=<MseLossBackward>)
output :  tensor([[153707.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1632e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145772.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2625412.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162359.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(371680.7500, grad_fn=<MseLossBackward>)
output :  tensor([[137945.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8654e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151273.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6116424.5000, grad_fn=<MseLossBackward>)
output :  tensor([[185235.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(7645052., grad_fn=<MseLossBackward>)
output :  tensor([[172372.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(11375337., grad_fn=<MseLossBackward>)
output :  tensor([[178478.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2314677., grad_fn=<MseLossBackward>)
output :  tensor([[220793.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(628972.9375, grad_fn=<MseLossBackward>)
output :  tensor([[106773.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1268439., grad_fn=<MseLossBackward>)
output :  tensor([[136739.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4017e+08, grad_fn=<MseLossBackward>)
output :  tensor([[286067.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4539.3906, grad_fn=<MseLossBackward>)
output :  tensor([[116966.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(934877.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175639.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9678e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179190.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(33755736., grad_fn=<MseLossBackward>)
output :  tensor([[185867.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(135217.0781, grad_fn=<MseLossBackward>)
output :  tensor([[249948.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2757e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222615.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(379359.7500, grad_fn=<MseLossBackward>)
output :  tensor([[126925.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4207e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175530.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0761e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125155.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1335830.2500, grad_fn=<MseLossBackward>)
output :  tensor([[181921.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5976e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149529.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(12045672., grad_fn=<MseLossBackward>)
output :  tensor([[154235.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(59841828., grad_fn=<MseLossBackward>)
output :  tensor([[206383.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7042.8809, grad_fn=<MseLossBackward>)
output :  tensor([[144599.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4639e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174786.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1472354.7500, grad_fn=<MseLossBackward>)
output :  tensor([[253904.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5513e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148120.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(14415.0039, grad_fn=<MseLossBackward>)
output :  tensor([[202034.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(397471.1562, grad_fn=<MseLossBackward>)
output :  tensor([[164856.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(24076042., grad_fn=<MseLossBackward>)
output :  tensor([[125539.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4092e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136678.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(861503., grad_fn=<MseLossBackward>)
output :  tensor([[185670.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2790726.7500, grad_fn=<MseLossBackward>)
output :  tensor([[200568.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1169e+08, grad_fn=<MseLossBackward>)
output :  tensor([[231355.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3228e+09, grad_fn=<MseLossBackward>)
output :  tensor([[251196.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(33683876., grad_fn=<MseLossBackward>)
output :  tensor([[185910.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7713e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143387.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6923e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139241.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(27647056., grad_fn=<MseLossBackward>)
output :  tensor([[71505.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9257e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132144.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8154951., grad_fn=<MseLossBackward>)
output :  tensor([[127378.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2314201.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153170.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(688640.6250, grad_fn=<MseLossBackward>)
output :  tensor([[129893.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8370986., grad_fn=<MseLossBackward>)
output :  tensor([[75688.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(659204.4375, grad_fn=<MseLossBackward>)
output :  tensor([[82881.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(777317.7500, grad_fn=<MseLossBackward>)
output :  tensor([[233122.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1259059.3750, grad_fn=<MseLossBackward>)
output :  tensor([[140753.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9825e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128663.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(3371096.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169423.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5875549., grad_fn=<MseLossBackward>)
output :  tensor([[237391.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5721440., grad_fn=<MseLossBackward>)
output :  tensor([[190480.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2752644., grad_fn=<MseLossBackward>)
output :  tensor([[154964.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1071386.7500, grad_fn=<MseLossBackward>)
output :  tensor([[201063.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(10008622., grad_fn=<MseLossBackward>)
output :  tensor([[200251.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3505e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135520.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2188319.2500, grad_fn=<MseLossBackward>)
output :  tensor([[152645.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5545068.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135537.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(213516.1875, grad_fn=<MseLossBackward>)
output :  tensor([[198979.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6228e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151585.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5828980.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138106.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9897e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144503.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(157323.7812, grad_fn=<MseLossBackward>)
output :  tensor([[206248.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(33081370., grad_fn=<MseLossBackward>)
output :  tensor([[102559.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2269e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167973.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(223995.1406, grad_fn=<MseLossBackward>)
output :  tensor([[130722.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(7410772.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145832.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1363165.7500, grad_fn=<MseLossBackward>)
output :  tensor([[105525.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8613e+09, grad_fn=<MseLossBackward>)
output :  tensor([[132026.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(29961596., grad_fn=<MseLossBackward>)
output :  tensor([[232701.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(10878247., grad_fn=<MseLossBackward>)
output :  tensor([[143494.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2266059.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138558.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1120389.1250, grad_fn=<MseLossBackward>)
output :  tensor([[165406.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3993e+09, grad_fn=<MseLossBackward>)
output :  tensor([[267994.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0010e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175275.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(76132.8828, grad_fn=<MseLossBackward>)
output :  tensor([[104035.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1585356.3750, grad_fn=<MseLossBackward>)
output :  tensor([[202365.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6451e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160993.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3972734., grad_fn=<MseLossBackward>)
output :  tensor([[163122.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5926e+10, grad_fn=<MseLossBackward>)
output :  tensor([[101232.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(8601618., grad_fn=<MseLossBackward>)
output :  tensor([[121989.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2593660., grad_fn=<MseLossBackward>)
output :  tensor([[156368.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(135608.0625, grad_fn=<MseLossBackward>)
output :  tensor([[140864.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(748062.8125, grad_fn=<MseLossBackward>)
output :  tensor([[202040.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4164915.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142819.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(671247.3750, grad_fn=<MseLossBackward>)
output :  tensor([[260910.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1874717.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129516.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3334e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164234.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1600501.7500, grad_fn=<MseLossBackward>)
output :  tensor([[188762.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(68750.4766, grad_fn=<MseLossBackward>)
output :  tensor([[123245.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7546e+08, grad_fn=<MseLossBackward>)
output :  tensor([[257426.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(55159632., grad_fn=<MseLossBackward>)
output :  tensor([[159281.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6830e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243298.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4207947., grad_fn=<MseLossBackward>)
output :  tensor([[143555.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(197524.6875, grad_fn=<MseLossBackward>)
output :  tensor([[208772.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1506717.8750, grad_fn=<MseLossBackward>)
output :  tensor([[176791.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(19285822., grad_fn=<MseLossBackward>)
output :  tensor([[153308.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(477610.5625, grad_fn=<MseLossBackward>)
output :  tensor([[116338.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(2761387., grad_fn=<MseLossBackward>)
output :  tensor([[241780.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0530e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238671.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1764040.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153756.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(175849.1875, grad_fn=<MseLossBackward>)
output :  tensor([[252253.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(7004624., grad_fn=<MseLossBackward>)
output :  tensor([[122830.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(69337368., grad_fn=<MseLossBackward>)
output :  tensor([[177720.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2959152.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159330.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(447749.1875, grad_fn=<MseLossBackward>)
output :  tensor([[128241.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7607426., grad_fn=<MseLossBackward>)
output :  tensor([[196186.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4471e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163428.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(326094.5312, grad_fn=<MseLossBackward>)
output :  tensor([[166925.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(15411881., grad_fn=<MseLossBackward>)
output :  tensor([[155857.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4591980., grad_fn=<MseLossBackward>)
output :  tensor([[145802.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(16786562., grad_fn=<MseLossBackward>)
output :  tensor([[172468.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9650e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158195.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3257404.5000, grad_fn=<MseLossBackward>)
output :  tensor([[381966.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4014888.7500, grad_fn=<MseLossBackward>)
output :  tensor([[127420.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(176439.3750, grad_fn=<MseLossBackward>)
output :  tensor([[129430.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9299e+09, grad_fn=<MseLossBackward>)
output :  tensor([[277585.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(13160343., grad_fn=<MseLossBackward>)
output :  tensor([[158998.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9007502., grad_fn=<MseLossBackward>)
output :  tensor([[131358.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1790e+08, grad_fn=<MseLossBackward>)
output :  tensor([[230263.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3013967.2500, grad_fn=<MseLossBackward>)
output :  tensor([[179080.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2016089.3750, grad_fn=<MseLossBackward>)
output :  tensor([[154487.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6188045., grad_fn=<MseLossBackward>)
output :  tensor([[145607.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(369170.1562, grad_fn=<MseLossBackward>)
output :  tensor([[154577.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1250e+08, grad_fn=<MseLossBackward>)
output :  tensor([[100819.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(671682.6875, grad_fn=<MseLossBackward>)
output :  tensor([[76770.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8124e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163915.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1175869.1250, grad_fn=<MseLossBackward>)
output :  tensor([[188482.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5616e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161622.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(13120582., grad_fn=<MseLossBackward>)
output :  tensor([[154682.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(7937249.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135430.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4078632.7500, grad_fn=<MseLossBackward>)
output :  tensor([[209629.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(13539755., grad_fn=<MseLossBackward>)
output :  tensor([[140403.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5778089., grad_fn=<MseLossBackward>)
output :  tensor([[182695.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6207e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147982.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3930430.2500, grad_fn=<MseLossBackward>)
output :  tensor([[111467.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1040e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93006.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(987585.6250, grad_fn=<MseLossBackward>)
output :  tensor([[176061.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1126782.2500, grad_fn=<MseLossBackward>)
output :  tensor([[258781.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2618429.7500, grad_fn=<MseLossBackward>)
output :  tensor([[139582.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3676087.2500, grad_fn=<MseLossBackward>)
output :  tensor([[159492.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(161855.3438, grad_fn=<MseLossBackward>)
output :  tensor([[133023.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(274346.8125, grad_fn=<MseLossBackward>)
output :  tensor([[149093.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(165293.0625, grad_fn=<MseLossBackward>)
output :  tensor([[168210.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(96303.5469, grad_fn=<MseLossBackward>)
output :  tensor([[125830.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1367913., grad_fn=<MseLossBackward>)
output :  tensor([[172947.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8105e+08, grad_fn=<MseLossBackward>)
output :  tensor([[159149.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4619208.5000, grad_fn=<MseLossBackward>)
output :  tensor([[118722.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4940548., grad_fn=<MseLossBackward>)
output :  tensor([[161921.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0521e+09, grad_fn=<MseLossBackward>)
output :  tensor([[50973.7539]], grad_fn=<AddmmBackward>)
loss:  tensor(1053181., grad_fn=<MseLossBackward>)
output :  tensor([[235187.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9772e+09, grad_fn=<MseLossBackward>)
output :  tensor([[202465.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2148056.7500, grad_fn=<MseLossBackward>)
output :  tensor([[183669.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1769980.7500, grad_fn=<MseLossBackward>)
output :  tensor([[105343.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(430848.6562, grad_fn=<MseLossBackward>)
output :  tensor([[89088.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(4362191., grad_fn=<MseLossBackward>)
output :  tensor([[142753.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7582709., grad_fn=<MseLossBackward>)
output :  tensor([[219670.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5249e+09, grad_fn=<MseLossBackward>)
output :  tensor([[203075.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(19573436., grad_fn=<MseLossBackward>)
output :  tensor([[171254.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(39118576., grad_fn=<MseLossBackward>)
output :  tensor([[172670.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5248e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190125.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(15785.5664, grad_fn=<MseLossBackward>)
output :  tensor([[91494.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(20202708., grad_fn=<MseLossBackward>)
output :  tensor([[141064.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1132295.5000, grad_fn=<MseLossBackward>)
output :  tensor([[112638.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4571177.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147099.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2409e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173647.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8188e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195457.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(91051848., grad_fn=<MseLossBackward>)
output :  tensor([[179780.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(48050.0117, grad_fn=<MseLossBackward>)
output :  tensor([[96991.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(241480.1094, grad_fn=<MseLossBackward>)
output :  tensor([[117261.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(56684.9141, grad_fn=<MseLossBackward>)
output :  tensor([[160510.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5177e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202167.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4696160., grad_fn=<MseLossBackward>)
output :  tensor([[139311.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(21980274., grad_fn=<MseLossBackward>)
train_loss: [2.5951137e+09]
epoch_result tensor([0.])
output :  tensor([[157502.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(995910.4375, grad_fn=<MseLossBackward>)
output :  tensor([[122863.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(745794.1875, grad_fn=<MseLossBackward>)
output :  tensor([[195583.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1910744.6250, grad_fn=<MseLossBackward>)
output :  tensor([[179013.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4053741.7500, grad_fn=<MseLossBackward>)
output :  tensor([[155024.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2786e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131183.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(10135568., grad_fn=<MseLossBackward>)
output :  tensor([[143807.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7881881., grad_fn=<MseLossBackward>)
output :  tensor([[121555.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6530261., grad_fn=<MseLossBackward>)
output :  tensor([[66824.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(69289760., grad_fn=<MseLossBackward>)
output :  tensor([[167442.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2080671., grad_fn=<MseLossBackward>)
output :  tensor([[134065.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(35214580., grad_fn=<MseLossBackward>)
output :  tensor([[227659.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7075517., grad_fn=<MseLossBackward>)
output :  tensor([[167457.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2380415., grad_fn=<MseLossBackward>)
output :  tensor([[249259.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(193696.2656, grad_fn=<MseLossBackward>)
output :  tensor([[53139.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3461344., grad_fn=<MseLossBackward>)
output :  tensor([[163402.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5732e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185089.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0180e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152895.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(12990843., grad_fn=<MseLossBackward>)
output :  tensor([[276243.]], grad_fn=<AddmmBackward>)
loss:  tensor(1545049., grad_fn=<MseLossBackward>)
output :  tensor([[195748.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1566682.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139828.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4350e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193508.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(137606.2188, grad_fn=<MseLossBackward>)
output :  tensor([[180232.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9952e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151348.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(121724.6719, grad_fn=<MseLossBackward>)
output :  tensor([[176329.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(40060196., grad_fn=<MseLossBackward>)
output :  tensor([[81951.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(11895278., grad_fn=<MseLossBackward>)
output :  tensor([[170899.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3524e+09, grad_fn=<MseLossBackward>)
output :  tensor([[187013.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4053490.2500, grad_fn=<MseLossBackward>)
output :  tensor([[204072.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6447e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108577.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(2022995.1250, grad_fn=<MseLossBackward>)
output :  tensor([[170633.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(134299.3438, grad_fn=<MseLossBackward>)
output :  tensor([[138556.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4227907., grad_fn=<MseLossBackward>)
output :  tensor([[130262.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1593038.3750, grad_fn=<MseLossBackward>)
output :  tensor([[117968.]], grad_fn=<AddmmBackward>)
loss:  tensor(2347024., grad_fn=<MseLossBackward>)
output :  tensor([[145740.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2602e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169343.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1216e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152485.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7759445.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178962.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1075531., grad_fn=<MseLossBackward>)
output :  tensor([[142839.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3384450., grad_fn=<MseLossBackward>)
output :  tensor([[107766.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1565e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136258.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2002e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138759.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(14132078., grad_fn=<MseLossBackward>)
output :  tensor([[139127.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4707e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225316.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(100261.2891, grad_fn=<MseLossBackward>)
output :  tensor([[132981.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(534658., grad_fn=<MseLossBackward>)
output :  tensor([[149453.]], grad_fn=<AddmmBackward>)
loss:  tensor(205209., grad_fn=<MseLossBackward>)
output :  tensor([[114249.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(5059020., grad_fn=<MseLossBackward>)
output :  tensor([[162675.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7158969., grad_fn=<MseLossBackward>)
output :  tensor([[147856.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2225e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191240.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(576270.7500, grad_fn=<MseLossBackward>)
output :  tensor([[134647.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(38833.6289, grad_fn=<MseLossBackward>)
output :  tensor([[111842.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(3393971.5000, grad_fn=<MseLossBackward>)
output :  tensor([[234009.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(95.6729, grad_fn=<MseLossBackward>)
output :  tensor([[165572.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2960e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153474.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(30535468., grad_fn=<MseLossBackward>)
output :  tensor([[202390.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8937e+10, grad_fn=<MseLossBackward>)
output :  tensor([[248103.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1214e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143854.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(125769.9766, grad_fn=<MseLossBackward>)
output :  tensor([[135215.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1478390., grad_fn=<MseLossBackward>)
output :  tensor([[154332.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(445910.9375, grad_fn=<MseLossBackward>)
output :  tensor([[135798.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(33617348., grad_fn=<MseLossBackward>)
output :  tensor([[180077.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3876e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181122.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(8865506., grad_fn=<MseLossBackward>)
output :  tensor([[160932.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(322446.5312, grad_fn=<MseLossBackward>)
output :  tensor([[138752.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(18044176., grad_fn=<MseLossBackward>)
output :  tensor([[142737.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(56584.5156, grad_fn=<MseLossBackward>)
output :  tensor([[148711.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(13774420., grad_fn=<MseLossBackward>)
output :  tensor([[174310.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2740e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194295.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1549e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139124.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6888164.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170077.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3322018.7500, grad_fn=<MseLossBackward>)
output :  tensor([[180953.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2128.9573, grad_fn=<MseLossBackward>)
output :  tensor([[117433.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(5922340.5000, grad_fn=<MseLossBackward>)
output :  tensor([[215133.]], grad_fn=<AddmmBackward>)
loss:  tensor(34421688., grad_fn=<MseLossBackward>)
output :  tensor([[180612.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(8335491., grad_fn=<MseLossBackward>)
output :  tensor([[127234.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3009140.7500, grad_fn=<MseLossBackward>)
output :  tensor([[194082.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5846573., grad_fn=<MseLossBackward>)
output :  tensor([[173902.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(994040.1875, grad_fn=<MseLossBackward>)
output :  tensor([[210967.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0724e+10, grad_fn=<MseLossBackward>)
output :  tensor([[211171.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(29326.5625, grad_fn=<MseLossBackward>)
output :  tensor([[167088.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3024e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193151.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1817230.3750, grad_fn=<MseLossBackward>)
output :  tensor([[111777.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1495194., grad_fn=<MseLossBackward>)
output :  tensor([[114181.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2827705., grad_fn=<MseLossBackward>)
output :  tensor([[109959.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(4162907., grad_fn=<MseLossBackward>)
output :  tensor([[148102.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1697361.1250, grad_fn=<MseLossBackward>)
output :  tensor([[160011.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3354e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178162.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3377382.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127594.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(9007.1963, grad_fn=<MseLossBackward>)
output :  tensor([[146134.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1287409.3750, grad_fn=<MseLossBackward>)
output :  tensor([[180261.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0576e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116241.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(434003.0312, grad_fn=<MseLossBackward>)
output :  tensor([[194965.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4140207.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150856.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(34295116., grad_fn=<MseLossBackward>)
output :  tensor([[216842.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(15541705., grad_fn=<MseLossBackward>)
output :  tensor([[127106.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(1224394.1250, grad_fn=<MseLossBackward>)
output :  tensor([[248095.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(54085.3164, grad_fn=<MseLossBackward>)
output :  tensor([[237979.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2110e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147913.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7269e+08, grad_fn=<MseLossBackward>)
output :  tensor([[86912.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7147e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194272.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5008e+09, grad_fn=<MseLossBackward>)
output :  tensor([[83373.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(5632575., grad_fn=<MseLossBackward>)
output :  tensor([[142654.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(9952842., grad_fn=<MseLossBackward>)
output :  tensor([[77103.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2571663.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144919.]], grad_fn=<AddmmBackward>)
loss:  tensor(3865156., grad_fn=<MseLossBackward>)
output :  tensor([[175483.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(266965.9688, grad_fn=<MseLossBackward>)
output :  tensor([[152854.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(417295.8125, grad_fn=<MseLossBackward>)
output :  tensor([[110097.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(7274609.5000, grad_fn=<MseLossBackward>)
output :  tensor([[203589.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2580e+10, grad_fn=<MseLossBackward>)
output :  tensor([[128134.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(133493.1875, grad_fn=<MseLossBackward>)
output :  tensor([[269910.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0180e+08, grad_fn=<MseLossBackward>)
output :  tensor([[298364.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3538e+08, grad_fn=<MseLossBackward>)
output :  tensor([[109173.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2802014.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170401.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4404292.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132762.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1317e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141652.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(7034347., grad_fn=<MseLossBackward>)
output :  tensor([[128495.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3078325., grad_fn=<MseLossBackward>)
output :  tensor([[126074.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(1153593.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134397.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1986e+08, grad_fn=<MseLossBackward>)
output :  tensor([[228547.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7812e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188087.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3382e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141926.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3895134., grad_fn=<MseLossBackward>)
output :  tensor([[128192.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(479145.1562, grad_fn=<MseLossBackward>)
output :  tensor([[109713.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2361696.5000, grad_fn=<MseLossBackward>)
output :  tensor([[255727.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8854e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136625.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2641031.2500, grad_fn=<MseLossBackward>)
output :  tensor([[204697.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2881347., grad_fn=<MseLossBackward>)
output :  tensor([[109937.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(25377508., grad_fn=<MseLossBackward>)
output :  tensor([[138371.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2491415.5000, grad_fn=<MseLossBackward>)
output :  tensor([[208273.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6329e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183574.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(13498391., grad_fn=<MseLossBackward>)
output :  tensor([[187329.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5424605., grad_fn=<MseLossBackward>)
output :  tensor([[163701.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1112e+10, grad_fn=<MseLossBackward>)
output :  tensor([[299651.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2495e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197011.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(789709.9375, grad_fn=<MseLossBackward>)
output :  tensor([[260772.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0189e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222660.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8783e+09, grad_fn=<MseLossBackward>)
output :  tensor([[277647.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5486e+09, grad_fn=<MseLossBackward>)
output :  tensor([[225404.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1973454.2500, grad_fn=<MseLossBackward>)
output :  tensor([[224017.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8218e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195238.]], grad_fn=<AddmmBackward>)
loss:  tensor(3104644., grad_fn=<MseLossBackward>)
output :  tensor([[158681.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8102e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133137.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(405788.9062, grad_fn=<MseLossBackward>)
output :  tensor([[133693.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3262877.7500, grad_fn=<MseLossBackward>)
output :  tensor([[90938.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(3744.8662, grad_fn=<MseLossBackward>)
output :  tensor([[107245.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(569258.4375, grad_fn=<MseLossBackward>)
output :  tensor([[273316.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0895e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237120.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4495791.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143414.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2515197.7500, grad_fn=<MseLossBackward>)
output :  tensor([[136829.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(449067.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175276.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2382778.2500, grad_fn=<MseLossBackward>)
output :  tensor([[146799.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2400708.2500, grad_fn=<MseLossBackward>)
output :  tensor([[166563.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8045e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164729.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(73229.4375, grad_fn=<MseLossBackward>)
output :  tensor([[137665.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(443493.5625, grad_fn=<MseLossBackward>)
output :  tensor([[189696.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5153e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110698.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(1693475.2500, grad_fn=<MseLossBackward>)
output :  tensor([[171163.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(699941.3750, grad_fn=<MseLossBackward>)
output :  tensor([[120958.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(918902., grad_fn=<MseLossBackward>)
output :  tensor([[87544.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(295970., grad_fn=<MseLossBackward>)
output :  tensor([[179400.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(359587.6250, grad_fn=<MseLossBackward>)
output :  tensor([[111387.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(2212261.2500, grad_fn=<MseLossBackward>)
output :  tensor([[238360.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(408600.6250, grad_fn=<MseLossBackward>)
output :  tensor([[246582.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2504652.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132158.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7069948.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110467.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2275289.5000, grad_fn=<MseLossBackward>)
output :  tensor([[290896.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1391e+10, grad_fn=<MseLossBackward>)
output :  tensor([[176330.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(23335844., grad_fn=<MseLossBackward>)
output :  tensor([[126411.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(1991295.8750, grad_fn=<MseLossBackward>)
output :  tensor([[145665.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6540e+08, grad_fn=<MseLossBackward>)
output :  tensor([[200417.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8449e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140903.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(9297.1777, grad_fn=<MseLossBackward>)
output :  tensor([[159491.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4522e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159316.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(29341520., grad_fn=<MseLossBackward>)
output :  tensor([[130419.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(844647.1875, grad_fn=<MseLossBackward>)
output :  tensor([[245601.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7662e+10, grad_fn=<MseLossBackward>)
output :  tensor([[404772.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7688836., grad_fn=<MseLossBackward>)
output :  tensor([[113905.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(24062704., grad_fn=<MseLossBackward>)
output :  tensor([[121954.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(11932545., grad_fn=<MseLossBackward>)
output :  tensor([[156422.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(9470622., grad_fn=<MseLossBackward>)
output :  tensor([[131874.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8956e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162927.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4895e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171499.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7822e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106851.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(10572659., grad_fn=<MseLossBackward>)
output :  tensor([[139761.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1534424.1250, grad_fn=<MseLossBackward>)
output :  tensor([[365814.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2190030., grad_fn=<MseLossBackward>)
output :  tensor([[207076.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2018e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176129.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(395935.9062, grad_fn=<MseLossBackward>)
output :  tensor([[201783.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1246188.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142913.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(15313281., grad_fn=<MseLossBackward>)
output :  tensor([[192676.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3325209.2500, grad_fn=<MseLossBackward>)
output :  tensor([[137432.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9594e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176238.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(22669800., grad_fn=<MseLossBackward>)
output :  tensor([[241013.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(972504.1250, grad_fn=<MseLossBackward>)
output :  tensor([[180578.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(43276456., grad_fn=<MseLossBackward>)
output :  tensor([[107451.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(300381.0625, grad_fn=<MseLossBackward>)
output :  tensor([[265836.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1626342.2500, grad_fn=<MseLossBackward>)
output :  tensor([[251582.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2505295.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122711.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(83011.5156, grad_fn=<MseLossBackward>)
output :  tensor([[217956.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2540e+09, grad_fn=<MseLossBackward>)
output :  tensor([[303133.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9138e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207965.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(932703.2500, grad_fn=<MseLossBackward>)
output :  tensor([[213818.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5922e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159197.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1682573.7500, grad_fn=<MseLossBackward>)
output :  tensor([[174668.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(21883976., grad_fn=<MseLossBackward>)
output :  tensor([[160222.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(10829755., grad_fn=<MseLossBackward>)
output :  tensor([[173303.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(10912493., grad_fn=<MseLossBackward>)
output :  tensor([[234702.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1087e+09, grad_fn=<MseLossBackward>)
output :  tensor([[218167.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2744e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161562.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1208e+08, grad_fn=<MseLossBackward>)
output :  tensor([[120869.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(4538131.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178021.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1043621.8750, grad_fn=<MseLossBackward>)
output :  tensor([[181497.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1627e+09, grad_fn=<MseLossBackward>)
output :  tensor([[208758.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4543e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136795.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5586575.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150335.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2572e+08, grad_fn=<MseLossBackward>)
output :  tensor([[274832.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4697108., grad_fn=<MseLossBackward>)
output :  tensor([[90947.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(35374520., grad_fn=<MseLossBackward>)
output :  tensor([[236800.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(90159.4453, grad_fn=<MseLossBackward>)
output :  tensor([[257645.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0581e+11, grad_fn=<MseLossBackward>)
output :  tensor([[171062.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1128142.7500, grad_fn=<MseLossBackward>)
output :  tensor([[193378.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7324e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154819.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(32642.3262, grad_fn=<MseLossBackward>)
output :  tensor([[205761.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1266e+09, grad_fn=<MseLossBackward>)
output :  tensor([[131110.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4454606., grad_fn=<MseLossBackward>)
output :  tensor([[145582.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(339852.5625, grad_fn=<MseLossBackward>)
output :  tensor([[169492.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2858e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185139.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(505165.5625, grad_fn=<MseLossBackward>)
output :  tensor([[128413.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5825585.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139521.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(9131445., grad_fn=<MseLossBackward>)
output :  tensor([[176783.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(14318183., grad_fn=<MseLossBackward>)
output :  tensor([[197897.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7147e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239160.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(14741760., grad_fn=<MseLossBackward>)
output :  tensor([[154062.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(879111.3125, grad_fn=<MseLossBackward>)
output :  tensor([[196771.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(594609.6875, grad_fn=<MseLossBackward>)
output :  tensor([[164472.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1914e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187065.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(57241992., grad_fn=<MseLossBackward>)
output :  tensor([[183621.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(13850958., grad_fn=<MseLossBackward>)
output :  tensor([[98111.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1235988., grad_fn=<MseLossBackward>)
output :  tensor([[172036.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1656e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134771.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(52126.5977, grad_fn=<MseLossBackward>)
output :  tensor([[121154.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(37873160., grad_fn=<MseLossBackward>)
output :  tensor([[172865.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1287232.1250, grad_fn=<MseLossBackward>)
output :  tensor([[84701.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(89008.9922, grad_fn=<MseLossBackward>)
output :  tensor([[288568.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2049550.1250, grad_fn=<MseLossBackward>)
output :  tensor([[171186.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(38268724., grad_fn=<MseLossBackward>)
output :  tensor([[190847.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0255e+10, grad_fn=<MseLossBackward>)
output :  tensor([[247115.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7045e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152462.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2137489.7500, grad_fn=<MseLossBackward>)
output :  tensor([[122451.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(2398070., grad_fn=<MseLossBackward>)
output :  tensor([[125541.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(31823438., grad_fn=<MseLossBackward>)
output :  tensor([[143683.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2276e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174098.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(9671.4932, grad_fn=<MseLossBackward>)
output :  tensor([[110337.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7495e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209841.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1698e+10, grad_fn=<MseLossBackward>)
output :  tensor([[231823.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(93633744., grad_fn=<MseLossBackward>)
output :  tensor([[251298.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0705e+10, grad_fn=<MseLossBackward>)
output :  tensor([[219566.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7766e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194651.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4604e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187435.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4184.4727, grad_fn=<MseLossBackward>)
output :  tensor([[205662.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8052e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189326.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1513e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179624.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(782036.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155044.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(9266602., grad_fn=<MseLossBackward>)
output :  tensor([[337288.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(83502.9375, grad_fn=<MseLossBackward>)
output :  tensor([[213022.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1044707.5625, grad_fn=<MseLossBackward>)
output :  tensor([[160996.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(993853.2500, grad_fn=<MseLossBackward>)
output :  tensor([[187324.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9350e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103408.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2532474.5000, grad_fn=<MseLossBackward>)
output :  tensor([[270223.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1098e+10, grad_fn=<MseLossBackward>)
output :  tensor([[168635.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(27711176., grad_fn=<MseLossBackward>)
output :  tensor([[212494.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1010339.0625, grad_fn=<MseLossBackward>)
output :  tensor([[209443.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3354e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179566.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(134207.7500, grad_fn=<MseLossBackward>)
output :  tensor([[196725.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(25749124., grad_fn=<MseLossBackward>)
output :  tensor([[159611.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(21267086., grad_fn=<MseLossBackward>)
output :  tensor([[147941.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2984e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116202.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5277070.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140730.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(532991.2500, grad_fn=<MseLossBackward>)
output :  tensor([[148099.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(810112.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202754.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5686e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161412.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3656401.2500, grad_fn=<MseLossBackward>)
output :  tensor([[100250.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(562781.3125, grad_fn=<MseLossBackward>)
output :  tensor([[224806.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3083e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184029.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4335e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175383.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1213233.3750, grad_fn=<MseLossBackward>)
output :  tensor([[80520.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2187579.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128130.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(136611.0938, grad_fn=<MseLossBackward>)
output :  tensor([[209900.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(16804620., grad_fn=<MseLossBackward>)
output :  tensor([[143162.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(701641.8125, grad_fn=<MseLossBackward>)
output :  tensor([[129682.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(101024.6484, grad_fn=<MseLossBackward>)
output :  tensor([[145584.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8905468., grad_fn=<MseLossBackward>)
output :  tensor([[177644.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6116e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145699.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2887344.2500, grad_fn=<MseLossBackward>)
output :  tensor([[161119.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1252475.7500, grad_fn=<MseLossBackward>)
output :  tensor([[213451.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2397174.7500, grad_fn=<MseLossBackward>)
output :  tensor([[137750.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0726e+09, grad_fn=<MseLossBackward>)
output :  tensor([[254462.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(288536.8438, grad_fn=<MseLossBackward>)
output :  tensor([[160136.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(405132.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128772.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(74090.2891, grad_fn=<MseLossBackward>)
output :  tensor([[96903.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(3622152.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154332.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8766e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180090.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(36123.7539, grad_fn=<MseLossBackward>)
output :  tensor([[121339.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(704511.0625, grad_fn=<MseLossBackward>)
output :  tensor([[188226.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6584e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144867.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2729e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149171.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(530393.5625, grad_fn=<MseLossBackward>)
output :  tensor([[188394.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(414836.6250, grad_fn=<MseLossBackward>)
output :  tensor([[250043.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8519e+09, grad_fn=<MseLossBackward>)
output :  tensor([[89433.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(4268905., grad_fn=<MseLossBackward>)
output :  tensor([[237547.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6014986., grad_fn=<MseLossBackward>)
output :  tensor([[129034.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(285999.3438, grad_fn=<MseLossBackward>)
output :  tensor([[165268.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0127e+10, grad_fn=<MseLossBackward>)
output :  tensor([[113585.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8456e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174652.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1815419.3750, grad_fn=<MseLossBackward>)
output :  tensor([[164160.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1307e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156649.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8380e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238475.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(274608.7500, grad_fn=<MseLossBackward>)
output :  tensor([[227640.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2171e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127409.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(167946.2812, grad_fn=<MseLossBackward>)
output :  tensor([[125760.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(57225.6094, grad_fn=<MseLossBackward>)
output :  tensor([[224348.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7031529.5000, grad_fn=<MseLossBackward>)
output :  tensor([[232887.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1237273.8750, grad_fn=<MseLossBackward>)
output :  tensor([[225866.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(694201.4375, grad_fn=<MseLossBackward>)
output :  tensor([[147774.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(51061.8750, grad_fn=<MseLossBackward>)
output :  tensor([[208742.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1582092.2500, grad_fn=<MseLossBackward>)
output :  tensor([[127762.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(60253616., grad_fn=<MseLossBackward>)
output :  tensor([[133210.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(504166.5625, grad_fn=<MseLossBackward>)
output :  tensor([[312424.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6633522., grad_fn=<MseLossBackward>)
output :  tensor([[138938.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4248236.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121935.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0179e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108278.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(1491470.6250, grad_fn=<MseLossBackward>)
output :  tensor([[154571.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2143e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181861.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6236e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173118.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(13927.6875, grad_fn=<MseLossBackward>)
output :  tensor([[191545.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(89389936., grad_fn=<MseLossBackward>)
output :  tensor([[101621.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(2628679.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179144.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(20902.8340, grad_fn=<MseLossBackward>)
output :  tensor([[167030.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(755704.2500, grad_fn=<MseLossBackward>)
output :  tensor([[136843.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4652581.5000, grad_fn=<MseLossBackward>)
output :  tensor([[260346.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7523e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141490.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1912e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173639.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(408820.3750, grad_fn=<MseLossBackward>)
output :  tensor([[139921.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6216.3369, grad_fn=<MseLossBackward>)
output :  tensor([[200774.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(75530.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166166.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(14695483., grad_fn=<MseLossBackward>)
output :  tensor([[240264.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(13950925., grad_fn=<MseLossBackward>)
output :  tensor([[134323.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(31323.4688, grad_fn=<MseLossBackward>)
output :  tensor([[149571.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(48965.3906, grad_fn=<MseLossBackward>)
output :  tensor([[214214.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(617771.4375, grad_fn=<MseLossBackward>)
output :  tensor([[161851.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(9911576., grad_fn=<MseLossBackward>)
output :  tensor([[192589.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(12887876., grad_fn=<MseLossBackward>)
output :  tensor([[131628.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4921e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125630.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(11350740., grad_fn=<MseLossBackward>)
output :  tensor([[141959.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3839334., grad_fn=<MseLossBackward>)
output :  tensor([[200817.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7173e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164860.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4861e+09, grad_fn=<MseLossBackward>)
output :  tensor([[75791.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4936e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94808.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0626e+08, grad_fn=<MseLossBackward>)
output :  tensor([[261818.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(72686816., grad_fn=<MseLossBackward>)
output :  tensor([[204432.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2814e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116382.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(1910204.7500, grad_fn=<MseLossBackward>)
output :  tensor([[157604.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9377e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206759.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7530e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180715.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9718e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157677.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7167416.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168886.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1239116.8750, grad_fn=<MseLossBackward>)
output :  tensor([[114114.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(784539.2500, grad_fn=<MseLossBackward>)
output :  tensor([[160961.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(35533892., grad_fn=<MseLossBackward>)
output :  tensor([[191481.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3772e+08, grad_fn=<MseLossBackward>)
output :  tensor([[216336.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(10009017., grad_fn=<MseLossBackward>)
output :  tensor([[243347.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5166e+11, grad_fn=<MseLossBackward>)
output :  tensor([[149079.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4322371., grad_fn=<MseLossBackward>)
output :  tensor([[109013.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(284180.6250, grad_fn=<MseLossBackward>)
output :  tensor([[169317.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5832e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150053.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(199767.0938, grad_fn=<MseLossBackward>)
output :  tensor([[240338.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(11142870., grad_fn=<MseLossBackward>)
output :  tensor([[115560.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(314107.7188, grad_fn=<MseLossBackward>)
output :  tensor([[180837.]], grad_fn=<AddmmBackward>)
loss:  tensor(4255969., grad_fn=<MseLossBackward>)
output :  tensor([[183003.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(13663188., grad_fn=<MseLossBackward>)
output :  tensor([[163662.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4441e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97523.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7302e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239561.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(314878.8125, grad_fn=<MseLossBackward>)
output :  tensor([[177180.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1394355., grad_fn=<MseLossBackward>)
output :  tensor([[142269.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5150843., grad_fn=<MseLossBackward>)
output :  tensor([[239023.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(16189558., grad_fn=<MseLossBackward>)
output :  tensor([[162618.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(145542.2500, grad_fn=<MseLossBackward>)
output :  tensor([[202714.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4954e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135907.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(823811.5000, grad_fn=<MseLossBackward>)
output :  tensor([[185456.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5022e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136999.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(999093.9375, grad_fn=<MseLossBackward>)
output :  tensor([[229620.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(40694832., grad_fn=<MseLossBackward>)
output :  tensor([[226710.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4238e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91077.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1161545., grad_fn=<MseLossBackward>)
output :  tensor([[162003.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6602731.5000, grad_fn=<MseLossBackward>)
output :  tensor([[244929.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5863e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145391.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(152905.4375, grad_fn=<MseLossBackward>)
output :  tensor([[108801.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7473e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162050.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5998749., grad_fn=<MseLossBackward>)
output :  tensor([[146088.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4360984., grad_fn=<MseLossBackward>)
output :  tensor([[129353.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1330634.3750, grad_fn=<MseLossBackward>)
output :  tensor([[190217.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7311e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123441.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(886981.3750, grad_fn=<MseLossBackward>)
output :  tensor([[152508.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(258762.9688, grad_fn=<MseLossBackward>)
output :  tensor([[169225.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6370970.5000, grad_fn=<MseLossBackward>)
output :  tensor([[148782.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4919039., grad_fn=<MseLossBackward>)
output :  tensor([[159982.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(8514359., grad_fn=<MseLossBackward>)
output :  tensor([[135192.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8603e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132009.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(98.7539, grad_fn=<MseLossBackward>)
output :  tensor([[155989.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8863e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144747.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(354676.0938, grad_fn=<MseLossBackward>)
output :  tensor([[162174.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(180160.4531, grad_fn=<MseLossBackward>)
output :  tensor([[139204.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5876e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149038.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(56740.7305, grad_fn=<MseLossBackward>)
output :  tensor([[185999.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4000125., grad_fn=<MseLossBackward>)
output :  tensor([[168840.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(25505.0879, grad_fn=<MseLossBackward>)
output :  tensor([[177940.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4239545.5000, grad_fn=<MseLossBackward>)
output :  tensor([[220485.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(235346.2656, grad_fn=<MseLossBackward>)
output :  tensor([[112974.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(25748806., grad_fn=<MseLossBackward>)
output :  tensor([[138527.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8570e+08, grad_fn=<MseLossBackward>)
output :  tensor([[281400.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(21157988., grad_fn=<MseLossBackward>)
output :  tensor([[118076.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(4312014.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175808.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9529e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185274.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(75453.2188, grad_fn=<MseLossBackward>)
output :  tensor([[170871.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1400e+08, grad_fn=<MseLossBackward>)
output :  tensor([[250626.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9408e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221245.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(569175.9375, grad_fn=<MseLossBackward>)
output :  tensor([[127254.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5602e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176002.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2913e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124669.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(447571.4688, grad_fn=<MseLossBackward>)
output :  tensor([[182806.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5522e+10, grad_fn=<MseLossBackward>)
output :  tensor([[156164.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(10011390., grad_fn=<MseLossBackward>)
output :  tensor([[154776.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(68494760., grad_fn=<MseLossBackward>)
output :  tensor([[205403.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(804328.6875, grad_fn=<MseLossBackward>)
output :  tensor([[145964.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8129e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175079.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(846572.5000, grad_fn=<MseLossBackward>)
output :  tensor([[252094.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5104e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146544.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2118116.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202421.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(59368.3672, grad_fn=<MseLossBackward>)
output :  tensor([[163171.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(10376653., grad_fn=<MseLossBackward>)
output :  tensor([[122709.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2048e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133546.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4854930., grad_fn=<MseLossBackward>)
output :  tensor([[181299.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7290928., grad_fn=<MseLossBackward>)
output :  tensor([[195432.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(29506794., grad_fn=<MseLossBackward>)
output :  tensor([[224460.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1653e+09, grad_fn=<MseLossBackward>)
output :  tensor([[253855.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(9886799., grad_fn=<MseLossBackward>)
output :  tensor([[188076.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7141e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143594.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7139e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144740.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(57847.7656, grad_fn=<MseLossBackward>)
output :  tensor([[71580.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9730e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140991.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(35894140., grad_fn=<MseLossBackward>)
output :  tensor([[132607.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(13749032., grad_fn=<MseLossBackward>)
output :  tensor([[156402.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5773958.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125170.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3347928., grad_fn=<MseLossBackward>)
output :  tensor([[76807.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(94599.5000, grad_fn=<MseLossBackward>)
output :  tensor([[84828.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7999263., grad_fn=<MseLossBackward>)
output :  tensor([[220298.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3693e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140648.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9236e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131334.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(695712.3750, grad_fn=<MseLossBackward>)
output :  tensor([[171622.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(21363172., grad_fn=<MseLossBackward>)
output :  tensor([[232214.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7760229., grad_fn=<MseLossBackward>)
output :  tensor([[187715.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(19578412., grad_fn=<MseLossBackward>)
output :  tensor([[156531.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(282243.1562, grad_fn=<MseLossBackward>)
output :  tensor([[198087.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(35097.6797, grad_fn=<MseLossBackward>)
output :  tensor([[203092.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1497e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136782.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(47462.7070, grad_fn=<MseLossBackward>)
output :  tensor([[154137.]], grad_fn=<AddmmBackward>)
loss:  tensor(744769., grad_fn=<MseLossBackward>)
output :  tensor([[137643.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2699705.7500, grad_fn=<MseLossBackward>)
output :  tensor([[199040.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5848e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154496.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(246310.5938, grad_fn=<MseLossBackward>)
output :  tensor([[136783.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8735e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150566.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(32110816., grad_fn=<MseLossBackward>)
output :  tensor([[209064.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(8617986., grad_fn=<MseLossBackward>)
output :  tensor([[104050.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8624e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163059.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(19719428., grad_fn=<MseLossBackward>)
output :  tensor([[129533.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(2350879.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144247.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7576858.5000, grad_fn=<MseLossBackward>)
output :  tensor([[102839.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6367e+09, grad_fn=<MseLossBackward>)
output :  tensor([[140016.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6335210.5000, grad_fn=<MseLossBackward>)
output :  tensor([[237993.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3972173.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146016.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1032510., grad_fn=<MseLossBackward>)
output :  tensor([[138364.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(747711.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164561.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3367e+09, grad_fn=<MseLossBackward>)
output :  tensor([[268643.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(87541168., grad_fn=<MseLossBackward>)
output :  tensor([[173776.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1496455.2500, grad_fn=<MseLossBackward>)
output :  tensor([[102517.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(66660.7812, grad_fn=<MseLossBackward>)
output :  tensor([[203724.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4428e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158256.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(553443., grad_fn=<MseLossBackward>)
output :  tensor([[162198.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6323e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97583.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(513629.7812, grad_fn=<MseLossBackward>)
output :  tensor([[126464.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(8207285., grad_fn=<MseLossBackward>)
output :  tensor([[157180.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1393543.3750, grad_fn=<MseLossBackward>)
output :  tensor([[139819.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(32433.7578, grad_fn=<MseLossBackward>)
output :  tensor([[201467.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2152593.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143525.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2328199.2500, grad_fn=<MseLossBackward>)
output :  tensor([[265186.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(8445744., grad_fn=<MseLossBackward>)
output :  tensor([[128610.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2681e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164100.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1958381.6250, grad_fn=<MseLossBackward>)
output :  tensor([[190291.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3211208., grad_fn=<MseLossBackward>)
output :  tensor([[124539.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1139e+08, grad_fn=<MseLossBackward>)
output :  tensor([[249328.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(451059.1562, grad_fn=<MseLossBackward>)
output :  tensor([[158145.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3258e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244445.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(818827.0625, grad_fn=<MseLossBackward>)
output :  tensor([[147686.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(13589821., grad_fn=<MseLossBackward>)
output :  tensor([[209400.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(359606.3438, grad_fn=<MseLossBackward>)
output :  tensor([[178753.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(40364380., grad_fn=<MseLossBackward>)
output :  tensor([[155184.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1401893., grad_fn=<MseLossBackward>)
output :  tensor([[123459.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(29806310., grad_fn=<MseLossBackward>)
output :  tensor([[240059.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2118e+09, grad_fn=<MseLossBackward>)
output :  tensor([[234872.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(26292858., grad_fn=<MseLossBackward>)
output :  tensor([[152519.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(668101.8750, grad_fn=<MseLossBackward>)
output :  tensor([[257096.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4824887., grad_fn=<MseLossBackward>)
output :  tensor([[124334.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(96639808., grad_fn=<MseLossBackward>)
output :  tensor([[176709.]], grad_fn=<AddmmBackward>)
loss:  tensor(502681., grad_fn=<MseLossBackward>)
output :  tensor([[160336.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(113064.0625, grad_fn=<MseLossBackward>)
output :  tensor([[130123.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(769060.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194302.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1994e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167506.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(12293241., grad_fn=<MseLossBackward>)
output :  tensor([[162973.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(696.4651, grad_fn=<MseLossBackward>)
output :  tensor([[156485.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2293947., grad_fn=<MseLossBackward>)
output :  tensor([[151522.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2631644.2500, grad_fn=<MseLossBackward>)
output :  tensor([[172702.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9946e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159286.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(509126.8438, grad_fn=<MseLossBackward>)
output :  tensor([[371025.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6757e+08, grad_fn=<MseLossBackward>)
output :  tensor([[119159.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(61467072., grad_fn=<MseLossBackward>)
output :  tensor([[126454.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6773e+09, grad_fn=<MseLossBackward>)
output :  tensor([[277423.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(14358889., grad_fn=<MseLossBackward>)
output :  tensor([[162147.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(21719.3906, grad_fn=<MseLossBackward>)
output :  tensor([[131125.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1290e+08, grad_fn=<MseLossBackward>)
output :  tensor([[240786.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(77201208., grad_fn=<MseLossBackward>)
output :  tensor([[176992.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(12304749., grad_fn=<MseLossBackward>)
output :  tensor([[150731.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1609964.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140980.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(16155250., grad_fn=<MseLossBackward>)
output :  tensor([[156687.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9155e+08, grad_fn=<MseLossBackward>)
output :  tensor([[101374.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(1888498.6250, grad_fn=<MseLossBackward>)
output :  tensor([[79086.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6428e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165214.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(45896.3672, grad_fn=<MseLossBackward>)
output :  tensor([[187865.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6107e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159449.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2101503.2500, grad_fn=<MseLossBackward>)
output :  tensor([[159839.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5473333.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138944.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2232176., grad_fn=<MseLossBackward>)
output :  tensor([[205417.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(283822.5625, grad_fn=<MseLossBackward>)
output :  tensor([[140225.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4954798., grad_fn=<MseLossBackward>)
output :  tensor([[183896.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5902e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145106.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(799124.2500, grad_fn=<MseLossBackward>)
output :  tensor([[110005.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2931e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94638.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(407921.7188, grad_fn=<MseLossBackward>)
output :  tensor([[175175.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(30937.5117, grad_fn=<MseLossBackward>)
output :  tensor([[264583.]], grad_fn=<AddmmBackward>)
loss:  tensor(17497488., grad_fn=<MseLossBackward>)
output :  tensor([[141472.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(734.9182, grad_fn=<MseLossBackward>)
output :  tensor([[159070.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(679336.5625, grad_fn=<MseLossBackward>)
output :  tensor([[131419.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1167007.6250, grad_fn=<MseLossBackward>)
output :  tensor([[149837.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(114043.3984, grad_fn=<MseLossBackward>)
output :  tensor([[171240.]], grad_fn=<AddmmBackward>)
loss:  tensor(11155600., grad_fn=<MseLossBackward>)
output :  tensor([[128649.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2720695.5000, grad_fn=<MseLossBackward>)
output :  tensor([[173912.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3593e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156021.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(957554., grad_fn=<MseLossBackward>)
output :  tensor([[116298.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(40687.3008, grad_fn=<MseLossBackward>)
output :  tensor([[161642.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0918e+09, grad_fn=<MseLossBackward>)
output :  tensor([[52697.1836]], grad_fn=<AddmmBackward>)
loss:  tensor(486064.9688, grad_fn=<MseLossBackward>)
output :  tensor([[230151.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7813e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201199.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(39607.2188, grad_fn=<MseLossBackward>)
output :  tensor([[182271.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(7445479.5000, grad_fn=<MseLossBackward>)
output :  tensor([[104736.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(1595465., grad_fn=<MseLossBackward>)
output :  tensor([[90441.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(11846719., grad_fn=<MseLossBackward>)
output :  tensor([[138452.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2394466., grad_fn=<MseLossBackward>)
output :  tensor([[221828.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2087e+09, grad_fn=<MseLossBackward>)
output :  tensor([[206077.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2023239.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157485.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(56473112., grad_fn=<MseLossBackward>)
output :  tensor([[172628.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5325e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189649.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(122981.7188, grad_fn=<MseLossBackward>)
output :  tensor([[90219.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(10368350., grad_fn=<MseLossBackward>)
output :  tensor([[136572.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(11745935., grad_fn=<MseLossBackward>)
output :  tensor([[111444.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(892464., grad_fn=<MseLossBackward>)
output :  tensor([[147147.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2517e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174256.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8711e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196241.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(76707768., grad_fn=<MseLossBackward>)
output :  tensor([[178246.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3073118.5000, grad_fn=<MseLossBackward>)
output :  tensor([[96008.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(241387.9688, grad_fn=<MseLossBackward>)
output :  tensor([[118000.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(250140.6406, grad_fn=<MseLossBackward>)
output :  tensor([[162456.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6414e+08, grad_fn=<MseLossBackward>)
output :  tensor([[200822.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(676120.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142325.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2804997., grad_fn=<MseLossBackward>)
train_loss: [2.6055903e+09]
epoch_result tensor([0.])
output :  tensor([[158117.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(146569.3438, grad_fn=<MseLossBackward>)
output :  tensor([[121653.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(120338.5234, grad_fn=<MseLossBackward>)
output :  tensor([[197870.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(13465116., grad_fn=<MseLossBackward>)
output :  tensor([[175679.]], grad_fn=<AddmmBackward>)
loss:  tensor(1745041., grad_fn=<MseLossBackward>)
output :  tensor([[152810.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3450e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127796.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(41466.3242, grad_fn=<MseLossBackward>)
output :  tensor([[142534.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2355793.2500, grad_fn=<MseLossBackward>)
output :  tensor([[119034.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1159.1897, grad_fn=<MseLossBackward>)
output :  tensor([[66781.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(68577288., grad_fn=<MseLossBackward>)
output :  tensor([[166844.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(712626.1250, grad_fn=<MseLossBackward>)
output :  tensor([[139574.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(181156.6406, grad_fn=<MseLossBackward>)
output :  tensor([[225529.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(280089.0312, grad_fn=<MseLossBackward>)
output :  tensor([[168864.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(18445.0352, grad_fn=<MseLossBackward>)
output :  tensor([[250647.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(898141.1875, grad_fn=<MseLossBackward>)
output :  tensor([[56711.4180]], grad_fn=<AddmmBackward>)
loss:  tensor(2928951.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162594.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2741e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177755.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(7593297., grad_fn=<MseLossBackward>)
output :  tensor([[172830.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6668e+08, grad_fn=<MseLossBackward>)
output :  tensor([[274078.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(849623.0625, grad_fn=<MseLossBackward>)
output :  tensor([[193908.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(9557469., grad_fn=<MseLossBackward>)
output :  tensor([[137290.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5740e+10, grad_fn=<MseLossBackward>)
output :  tensor([[200085.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(38515988., grad_fn=<MseLossBackward>)
output :  tensor([[181040.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9237e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150491.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(258731.1875, grad_fn=<MseLossBackward>)
output :  tensor([[172576.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6640848.5000, grad_fn=<MseLossBackward>)
output :  tensor([[85640.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(58054.6445, grad_fn=<MseLossBackward>)
output :  tensor([[172158.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4998e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183340.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2754718.2500, grad_fn=<MseLossBackward>)
output :  tensor([[208846.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1765e+09, grad_fn=<MseLossBackward>)
output :  tensor([[112987.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8924129., grad_fn=<MseLossBackward>)
output :  tensor([[172022.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1044835.3125, grad_fn=<MseLossBackward>)
output :  tensor([[135640.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(739170.0625, grad_fn=<MseLossBackward>)
output :  tensor([[128066.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(870780.5625, grad_fn=<MseLossBackward>)
output :  tensor([[122113.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6831444., grad_fn=<MseLossBackward>)
output :  tensor([[149143.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0332e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167163.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1856e+10, grad_fn=<MseLossBackward>)
output :  tensor([[148580.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1253875., grad_fn=<MseLossBackward>)
output :  tensor([[182438.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5948645., grad_fn=<MseLossBackward>)
output :  tensor([[141679.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(461762.7188, grad_fn=<MseLossBackward>)
output :  tensor([[106824.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8307e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133697.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6100e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130873.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(17030968., grad_fn=<MseLossBackward>)
output :  tensor([[130628.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(13163574., grad_fn=<MseLossBackward>)
output :  tensor([[223303.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2879278.7500, grad_fn=<MseLossBackward>)
output :  tensor([[131364.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(783667.5625, grad_fn=<MseLossBackward>)
output :  tensor([[148402.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(357211.6562, grad_fn=<MseLossBackward>)
output :  tensor([[112446.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(199795.0312, grad_fn=<MseLossBackward>)
output :  tensor([[161356.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1839626., grad_fn=<MseLossBackward>)
output :  tensor([[145414.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4587e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196578.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(20958228., grad_fn=<MseLossBackward>)
output :  tensor([[135693.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1546991.7500, grad_fn=<MseLossBackward>)
output :  tensor([[103107.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(47500848., grad_fn=<MseLossBackward>)
output :  tensor([[234559.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(313372.5312, grad_fn=<MseLossBackward>)
output :  tensor([[165983.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2568e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162509.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(12313629., grad_fn=<MseLossBackward>)
output :  tensor([[205503.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7888e+10, grad_fn=<MseLossBackward>)
output :  tensor([[247677.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1304e+10, grad_fn=<MseLossBackward>)
output :  tensor([[140946.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(6518607., grad_fn=<MseLossBackward>)
output :  tensor([[133173.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(683231.3750, grad_fn=<MseLossBackward>)
output :  tensor([[158509.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(12313300., grad_fn=<MseLossBackward>)
output :  tensor([[134452.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(19828652., grad_fn=<MseLossBackward>)
output :  tensor([[179449.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4884e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179775.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(18704814., grad_fn=<MseLossBackward>)
output :  tensor([[163309.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3274686., grad_fn=<MseLossBackward>)
output :  tensor([[152424.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(88823848., grad_fn=<MseLossBackward>)
output :  tensor([[141872.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(393481.7812, grad_fn=<MseLossBackward>)
output :  tensor([[142514.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6177555., grad_fn=<MseLossBackward>)
output :  tensor([[175801.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0813e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193654.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4502e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137959.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2130550.7500, grad_fn=<MseLossBackward>)
output :  tensor([[173956.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4229513.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179687.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1723928., grad_fn=<MseLossBackward>)
output :  tensor([[118333.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(11113889., grad_fn=<MseLossBackward>)
output :  tensor([[221619.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(383277.0625, grad_fn=<MseLossBackward>)
output :  tensor([[187985.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(20118870., grad_fn=<MseLossBackward>)
output :  tensor([[126539.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1080852.6250, grad_fn=<MseLossBackward>)
output :  tensor([[197973.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2171616.7500, grad_fn=<MseLossBackward>)
output :  tensor([[173151.]], grad_fn=<AddmmBackward>)
loss:  tensor(3059001., grad_fn=<MseLossBackward>)
output :  tensor([[206289.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2386e+10, grad_fn=<MseLossBackward>)
output :  tensor([[207559.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(11837040., grad_fn=<MseLossBackward>)
output :  tensor([[165220.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1710e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195378.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(771350.5000, grad_fn=<MseLossBackward>)
output :  tensor([[113890.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(792559., grad_fn=<MseLossBackward>)
output :  tensor([[113861.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(1853958.8750, grad_fn=<MseLossBackward>)
output :  tensor([[112137.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(18779.7051, grad_fn=<MseLossBackward>)
output :  tensor([[146560.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(57510.0352, grad_fn=<MseLossBackward>)
output :  tensor([[159795.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3433e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177532.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6089558.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128906.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1977670.8750, grad_fn=<MseLossBackward>)
output :  tensor([[140278.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(22294480., grad_fn=<MseLossBackward>)
output :  tensor([[184294.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4398e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120941.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(16333217., grad_fn=<MseLossBackward>)
output :  tensor([[198761.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3104313.7500, grad_fn=<MseLossBackward>)
output :  tensor([[146675.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2807457.2500, grad_fn=<MseLossBackward>)
output :  tensor([[209756.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9880021., grad_fn=<MseLossBackward>)
output :  tensor([[128587.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6697582.5000, grad_fn=<MseLossBackward>)
output :  tensor([[247403.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(854931.3750, grad_fn=<MseLossBackward>)
output :  tensor([[237244.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2806e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145500.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9881e+08, grad_fn=<MseLossBackward>)
output :  tensor([[86530.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5180e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194010.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5432e+09, grad_fn=<MseLossBackward>)
output :  tensor([[80778.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(48972.3086, grad_fn=<MseLossBackward>)
output :  tensor([[140436.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(877793.3125, grad_fn=<MseLossBackward>)
output :  tensor([[74651.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(719461.8125, grad_fn=<MseLossBackward>)
output :  tensor([[143458.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(255767.2656, grad_fn=<MseLossBackward>)
output :  tensor([[176667.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(446203.1250, grad_fn=<MseLossBackward>)
output :  tensor([[155933.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5921238., grad_fn=<MseLossBackward>)
output :  tensor([[109730.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5430138., grad_fn=<MseLossBackward>)
output :  tensor([[205082.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2247e+10, grad_fn=<MseLossBackward>)
output :  tensor([[129769.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1612304.7500, grad_fn=<MseLossBackward>)
output :  tensor([[268643.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2897e+08, grad_fn=<MseLossBackward>)
output :  tensor([[307350.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(7019519., grad_fn=<MseLossBackward>)
output :  tensor([[108545.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(1093968.8750, grad_fn=<MseLossBackward>)
output :  tensor([[169823.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(7163987., grad_fn=<MseLossBackward>)
output :  tensor([[132831.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1659e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137318.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2829019., grad_fn=<MseLossBackward>)
output :  tensor([[128049.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(4841684.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129330.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(18756208., grad_fn=<MseLossBackward>)
output :  tensor([[133623.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8195e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226190.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8734e+10, grad_fn=<MseLossBackward>)
output :  tensor([[185920.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4050e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145097.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1433968.8750, grad_fn=<MseLossBackward>)
output :  tensor([[128708.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(1460717.7500, grad_fn=<MseLossBackward>)
output :  tensor([[111281.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1003.1077, grad_fn=<MseLossBackward>)
output :  tensor([[252432.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3071e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133306.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2868048., grad_fn=<MseLossBackward>)
output :  tensor([[201287.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2933780.2500, grad_fn=<MseLossBackward>)
output :  tensor([[103674.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(1501333.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140993.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1088175., grad_fn=<MseLossBackward>)
output :  tensor([[205354.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6655e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173843.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(36678920., grad_fn=<MseLossBackward>)
output :  tensor([[185267.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(71455.9688, grad_fn=<MseLossBackward>)
output :  tensor([[163704.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1111e+10, grad_fn=<MseLossBackward>)
output :  tensor([[302067.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0846e+09, grad_fn=<MseLossBackward>)
output :  tensor([[198675.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(600988.3125, grad_fn=<MseLossBackward>)
output :  tensor([[257188.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1220e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221799.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9537e+09, grad_fn=<MseLossBackward>)
output :  tensor([[280539.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3294e+09, grad_fn=<MseLossBackward>)
output :  tensor([[220997.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(9015663., grad_fn=<MseLossBackward>)
output :  tensor([[223293.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8462e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193933.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(9403806., grad_fn=<MseLossBackward>)
output :  tensor([[156913.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7915e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132582.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(6826.8906, grad_fn=<MseLossBackward>)
output :  tensor([[136180.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(463548.2188, grad_fn=<MseLossBackward>)
output :  tensor([[90186.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(661528.0625, grad_fn=<MseLossBackward>)
output :  tensor([[109794.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(3219305., grad_fn=<MseLossBackward>)
output :  tensor([[275192.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8844e+09, grad_fn=<MseLossBackward>)
output :  tensor([[232299.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(7292194., grad_fn=<MseLossBackward>)
output :  tensor([[146681.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2827810., grad_fn=<MseLossBackward>)
output :  tensor([[139257.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3090509., grad_fn=<MseLossBackward>)
output :  tensor([[174407.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(454528.7812, grad_fn=<MseLossBackward>)
output :  tensor([[142633.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6845009.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163642.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5221e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163929.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1145000.3750, grad_fn=<MseLossBackward>)
output :  tensor([[137906.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(821147.4375, grad_fn=<MseLossBackward>)
output :  tensor([[187916.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2793e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113310.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(1717594.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172559.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(313075.2188, grad_fn=<MseLossBackward>)
output :  tensor([[117148.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(8130295., grad_fn=<MseLossBackward>)
output :  tensor([[87089.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(8085.9434, grad_fn=<MseLossBackward>)
output :  tensor([[179087.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(832513.6875, grad_fn=<MseLossBackward>)
output :  tensor([[110490.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(348229.0625, grad_fn=<MseLossBackward>)
output :  tensor([[238004.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(991269.1250, grad_fn=<MseLossBackward>)
output :  tensor([[244032.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(935905.0625, grad_fn=<MseLossBackward>)
output :  tensor([[125523.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(15808949., grad_fn=<MseLossBackward>)
output :  tensor([[106163.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(7813379., grad_fn=<MseLossBackward>)
output :  tensor([[287028.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2538e+10, grad_fn=<MseLossBackward>)
output :  tensor([[173522.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4090379.7500, grad_fn=<MseLossBackward>)
output :  tensor([[122506.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6218477.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143427.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4655e+08, grad_fn=<MseLossBackward>)
output :  tensor([[201228.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6312e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141311.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(97100.4062, grad_fn=<MseLossBackward>)
output :  tensor([[157240.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5070e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152986.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(834967.6250, grad_fn=<MseLossBackward>)
output :  tensor([[132815.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(10994820., grad_fn=<MseLossBackward>)
output :  tensor([[245313.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7739e+10, grad_fn=<MseLossBackward>)
output :  tensor([[397709.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(18406514., grad_fn=<MseLossBackward>)
output :  tensor([[105578.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(11708908., grad_fn=<MseLossBackward>)
output :  tensor([[114000.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(20243320., grad_fn=<MseLossBackward>)
output :  tensor([[157074.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(5883050., grad_fn=<MseLossBackward>)
output :  tensor([[129766.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8727e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163646.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4051e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173201.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9945e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105435.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3369863.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139380.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2623286.2500, grad_fn=<MseLossBackward>)
output :  tensor([[364937.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5552061.5000, grad_fn=<MseLossBackward>)
output :  tensor([[201483.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7579e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178849.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(11216429., grad_fn=<MseLossBackward>)
output :  tensor([[209646.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(45515472., grad_fn=<MseLossBackward>)
output :  tensor([[143174.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(17423320., grad_fn=<MseLossBackward>)
output :  tensor([[197039.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6448981., grad_fn=<MseLossBackward>)
output :  tensor([[135582.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8865e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178977.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4088863.2500, grad_fn=<MseLossBackward>)
output :  tensor([[240875.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1263516.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172887.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1238629.8750, grad_fn=<MseLossBackward>)
output :  tensor([[110847.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8106921.5000, grad_fn=<MseLossBackward>)
output :  tensor([[263498.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1129504., grad_fn=<MseLossBackward>)
output :  tensor([[247867.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4547090., grad_fn=<MseLossBackward>)
output :  tensor([[125235.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4997600., grad_fn=<MseLossBackward>)
output :  tensor([[216774.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3902e+09, grad_fn=<MseLossBackward>)
output :  tensor([[304026.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5258e+08, grad_fn=<MseLossBackward>)
output :  tensor([[205358.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2695497., grad_fn=<MseLossBackward>)
output :  tensor([[214571.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5732e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158903.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1006792.7500, grad_fn=<MseLossBackward>)
output :  tensor([[168743.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1554697.2500, grad_fn=<MseLossBackward>)
output :  tensor([[160510.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(12803761., grad_fn=<MseLossBackward>)
output :  tensor([[171192.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1423174.5000, grad_fn=<MseLossBackward>)
output :  tensor([[239049.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3813e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222089.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(54260720., grad_fn=<MseLossBackward>)
output :  tensor([[160989.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9571e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122718.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(79519.5938, grad_fn=<MseLossBackward>)
output :  tensor([[174355.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6993215., grad_fn=<MseLossBackward>)
output :  tensor([[181022.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2375e+09, grad_fn=<MseLossBackward>)
output :  tensor([[209422.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4297e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133680.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(564212.2500, grad_fn=<MseLossBackward>)
output :  tensor([[148744.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3682e+08, grad_fn=<MseLossBackward>)
output :  tensor([[276555.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(197830.3594, grad_fn=<MseLossBackward>)
output :  tensor([[89351.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(18939020., grad_fn=<MseLossBackward>)
output :  tensor([[236882.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(146401.8906, grad_fn=<MseLossBackward>)
output :  tensor([[258302.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0539e+11, grad_fn=<MseLossBackward>)
output :  tensor([[170870.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(756981.5625, grad_fn=<MseLossBackward>)
output :  tensor([[195040.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5967e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154845.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(23913.7227, grad_fn=<MseLossBackward>)
output :  tensor([[206558.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0248e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130510.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2282885., grad_fn=<MseLossBackward>)
output :  tensor([[143266.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3006051.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170500.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8401e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183101.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7553823., grad_fn=<MseLossBackward>)
output :  tensor([[126841.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(707346.6875, grad_fn=<MseLossBackward>)
output :  tensor([[138483.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3933032.7500, grad_fn=<MseLossBackward>)
output :  tensor([[171859.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1300811.5000, grad_fn=<MseLossBackward>)
output :  tensor([[196334.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8800e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238705.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(18441120., grad_fn=<MseLossBackward>)
output :  tensor([[154024.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(951021.1250, grad_fn=<MseLossBackward>)
output :  tensor([[193377.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6879063.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160416.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6950e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188514.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(81265152., grad_fn=<MseLossBackward>)
output :  tensor([[175300.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(21153962., grad_fn=<MseLossBackward>)
output :  tensor([[99261.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(5116114., grad_fn=<MseLossBackward>)
output :  tensor([[173900.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1257e+10, grad_fn=<MseLossBackward>)
output :  tensor([[137365.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5595294.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120495.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(30205672., grad_fn=<MseLossBackward>)
output :  tensor([[171965.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4139699., grad_fn=<MseLossBackward>)
output :  tensor([[85446.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(199480.8750, grad_fn=<MseLossBackward>)
output :  tensor([[288884.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1243573.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169430.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(19628914., grad_fn=<MseLossBackward>)
output :  tensor([[193348.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9550e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243935.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3249e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150732.]], grad_fn=<AddmmBackward>)
loss:  tensor(71824., grad_fn=<MseLossBackward>)
output :  tensor([[122557.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2080220.2500, grad_fn=<MseLossBackward>)
output :  tensor([[120739.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(705140.6875, grad_fn=<MseLossBackward>)
output :  tensor([[144711.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8279e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174392.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(153688.5000, grad_fn=<MseLossBackward>)
output :  tensor([[114090.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9795e+08, grad_fn=<MseLossBackward>)
output :  tensor([[210006.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1663e+10, grad_fn=<MseLossBackward>)
output :  tensor([[244252.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7575138., grad_fn=<MseLossBackward>)
output :  tensor([[253509.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0074e+10, grad_fn=<MseLossBackward>)
output :  tensor([[220097.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5731e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195555.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4387e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190542.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9259183., grad_fn=<MseLossBackward>)
output :  tensor([[206204.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7815e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187788.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1967e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174058.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(21918490., grad_fn=<MseLossBackward>)
output :  tensor([[154936.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8622115., grad_fn=<MseLossBackward>)
output :  tensor([[335180.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3311035.2500, grad_fn=<MseLossBackward>)
output :  tensor([[210545.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2114934., grad_fn=<MseLossBackward>)
output :  tensor([[160226.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(51408.4766, grad_fn=<MseLossBackward>)
output :  tensor([[186738.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9989e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110434.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(29529374., grad_fn=<MseLossBackward>)
output :  tensor([[273687.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9137e+10, grad_fn=<MseLossBackward>)
output :  tensor([[172886.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1026390.6250, grad_fn=<MseLossBackward>)
output :  tensor([[217765.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(18191292., grad_fn=<MseLossBackward>)
output :  tensor([[210069.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1948e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178747.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(204897.6875, grad_fn=<MseLossBackward>)
output :  tensor([[203549.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3059110.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156350.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1822964.1250, grad_fn=<MseLossBackward>)
output :  tensor([[148387.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3414e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118582.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(6738.1011, grad_fn=<MseLossBackward>)
output :  tensor([[139483.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(266368.8750, grad_fn=<MseLossBackward>)
output :  tensor([[148889.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(12158.5078, grad_fn=<MseLossBackward>)
output :  tensor([[201718.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5947e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161045.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2388908.2500, grad_fn=<MseLossBackward>)
output :  tensor([[99600.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(10003.1250, grad_fn=<MseLossBackward>)
output :  tensor([[225192.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1927e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188428.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2573e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174265.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4926735., grad_fn=<MseLossBackward>)
output :  tensor([[84896.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8389079., grad_fn=<MseLossBackward>)
output :  tensor([[129934.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(2057050.6250, grad_fn=<MseLossBackward>)
output :  tensor([[216539.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6448504.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143224.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(601376., grad_fn=<MseLossBackward>)
output :  tensor([[134688.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(21984524., grad_fn=<MseLossBackward>)
output :  tensor([[143162.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(316634.8125, grad_fn=<MseLossBackward>)
output :  tensor([[177413.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5931e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146338.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5468655.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160184.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(34161.4375, grad_fn=<MseLossBackward>)
output :  tensor([[215071.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5139.0977, grad_fn=<MseLossBackward>)
output :  tensor([[137516.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0573e+09, grad_fn=<MseLossBackward>)
output :  tensor([[255151.]], grad_fn=<AddmmBackward>)
loss:  tensor(22801., grad_fn=<MseLossBackward>)
output :  tensor([[156419.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(9491887., grad_fn=<MseLossBackward>)
output :  tensor([[130556.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4227329., grad_fn=<MseLossBackward>)
output :  tensor([[96279.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(1637260.2500, grad_fn=<MseLossBackward>)
output :  tensor([[154927.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9600e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178654.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1551231.3750, grad_fn=<MseLossBackward>)
output :  tensor([[117390.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(9670594., grad_fn=<MseLossBackward>)
output :  tensor([[188166.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6633e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144223.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1891e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154248.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(18907142., grad_fn=<MseLossBackward>)
output :  tensor([[187868.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(14020.0400, grad_fn=<MseLossBackward>)
output :  tensor([[251130.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7595e+09, grad_fn=<MseLossBackward>)
output :  tensor([[91612.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(12565.0088, grad_fn=<MseLossBackward>)
output :  tensor([[237833.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4693790., grad_fn=<MseLossBackward>)
output :  tensor([[127869.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(397894.8438, grad_fn=<MseLossBackward>)
output :  tensor([[164219.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0339e+10, grad_fn=<MseLossBackward>)
output :  tensor([[113025.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6966e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178053.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4215835.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163128.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6306e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155488.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2440e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237496.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2260512.2500, grad_fn=<MseLossBackward>)
output :  tensor([[226285.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0058e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124366.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6933758.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128544.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(6475872., grad_fn=<MseLossBackward>)
output :  tensor([[223006.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(15945297., grad_fn=<MseLossBackward>)
output :  tensor([[229975.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(16192953., grad_fn=<MseLossBackward>)
output :  tensor([[231803.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(26048584., grad_fn=<MseLossBackward>)
output :  tensor([[147103.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(803040., grad_fn=<MseLossBackward>)
output :  tensor([[208903.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1201558.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129815.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(96334840., grad_fn=<MseLossBackward>)
output :  tensor([[135332.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(8023145., grad_fn=<MseLossBackward>)
output :  tensor([[310465.]], grad_fn=<AddmmBackward>)
loss:  tensor(20566224., grad_fn=<MseLossBackward>)
output :  tensor([[144523.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(12412740., grad_fn=<MseLossBackward>)
output :  tensor([[122068.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0325e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109094.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(164557., grad_fn=<MseLossBackward>)
output :  tensor([[156542.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5464e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178551.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2493e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174790.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3204659.5000, grad_fn=<MseLossBackward>)
output :  tensor([[190613.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0787e+08, grad_fn=<MseLossBackward>)
output :  tensor([[95078.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(24223930., grad_fn=<MseLossBackward>)
output :  tensor([[178359.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(410400.3750, grad_fn=<MseLossBackward>)
output :  tensor([[173609.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(32596606., grad_fn=<MseLossBackward>)
output :  tensor([[142501.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(12260283., grad_fn=<MseLossBackward>)
output :  tensor([[261297.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5653e+09, grad_fn=<MseLossBackward>)
output :  tensor([[140408.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0701e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176560.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(12674156., grad_fn=<MseLossBackward>)
output :  tensor([[143956.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(15657231., grad_fn=<MseLossBackward>)
output :  tensor([[191881.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(74283656., grad_fn=<MseLossBackward>)
output :  tensor([[166210.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(14360429., grad_fn=<MseLossBackward>)
output :  tensor([[242126.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3509651., grad_fn=<MseLossBackward>)
output :  tensor([[133078.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2021106.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150833.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2200540.5000, grad_fn=<MseLossBackward>)
output :  tensor([[217187.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4785908., grad_fn=<MseLossBackward>)
output :  tensor([[159631.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(28819618., grad_fn=<MseLossBackward>)
output :  tensor([[187724.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1626740.8750, grad_fn=<MseLossBackward>)
output :  tensor([[132585.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9771e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130432.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2052190.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139504.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(245830.0312, grad_fn=<MseLossBackward>)
output :  tensor([[201739.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5914e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166132.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6146e+09, grad_fn=<MseLossBackward>)
output :  tensor([[75617.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4390e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94010.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(90448272., grad_fn=<MseLossBackward>)
output :  tensor([[252787.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(255862.0938, grad_fn=<MseLossBackward>)
output :  tensor([[204053.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2319e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115408.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(167185.1562, grad_fn=<MseLossBackward>)
output :  tensor([[157034.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2817e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208915.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2287e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181718.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7937e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158868.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(14968798., grad_fn=<MseLossBackward>)
output :  tensor([[165826.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(17415494., grad_fn=<MseLossBackward>)
output :  tensor([[114776.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(49753.3945, grad_fn=<MseLossBackward>)
output :  tensor([[161179.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(38188732., grad_fn=<MseLossBackward>)
output :  tensor([[194264.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5966e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219694.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(37988.4453, grad_fn=<MseLossBackward>)
output :  tensor([[245997.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4900e+11, grad_fn=<MseLossBackward>)
output :  tensor([[144151.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8114842.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110999.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(6348156., grad_fn=<MseLossBackward>)
output :  tensor([[169889.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4425e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152046.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2390164.2500, grad_fn=<MseLossBackward>)
output :  tensor([[232104.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(23968674., grad_fn=<MseLossBackward>)
output :  tensor([[116125.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(1266592., grad_fn=<MseLossBackward>)
output :  tensor([[183890.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(980502.2500, grad_fn=<MseLossBackward>)
output :  tensor([[186657.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1807.5784, grad_fn=<MseLossBackward>)
output :  tensor([[164282.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4248e+10, grad_fn=<MseLossBackward>)
output :  tensor([[93354.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5263e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237117.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3542982.7500, grad_fn=<MseLossBackward>)
output :  tensor([[177473.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2171478.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141292.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1670839., grad_fn=<MseLossBackward>)
output :  tensor([[234614.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(148875.4062, grad_fn=<MseLossBackward>)
output :  tensor([[168754.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(33119666., grad_fn=<MseLossBackward>)
output :  tensor([[203674.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4720e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132846.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4636822., grad_fn=<MseLossBackward>)
output :  tensor([[185234.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3984e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136716.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(513529., grad_fn=<MseLossBackward>)
output :  tensor([[229835.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(37998364., grad_fn=<MseLossBackward>)
output :  tensor([[227019.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2809e+08, grad_fn=<MseLossBackward>)
output :  tensor([[90947.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(897178.9375, grad_fn=<MseLossBackward>)
output :  tensor([[157219.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4903249., grad_fn=<MseLossBackward>)
output :  tensor([[247141.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5311e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145475.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(225803.1562, grad_fn=<MseLossBackward>)
output :  tensor([[109707.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8239e+09, grad_fn=<MseLossBackward>)
output :  tensor([[168485.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(15881470., grad_fn=<MseLossBackward>)
output :  tensor([[140856.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(9882378., grad_fn=<MseLossBackward>)
output :  tensor([[128737.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(288419.3438, grad_fn=<MseLossBackward>)
output :  tensor([[188025.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0374e+09, grad_fn=<MseLossBackward>)
output :  tensor([[122055.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(197517.7500, grad_fn=<MseLossBackward>)
output :  tensor([[151172.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(684213.3125, grad_fn=<MseLossBackward>)
output :  tensor([[167455.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(18438838., grad_fn=<MseLossBackward>)
output :  tensor([[151236.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(55880.5273, grad_fn=<MseLossBackward>)
output :  tensor([[158539.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(19012326., grad_fn=<MseLossBackward>)
output :  tensor([[135461.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0022e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130980.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1039412.1250, grad_fn=<MseLossBackward>)
output :  tensor([[153598.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1311e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145551.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1957244.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161542.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(43075.7070, grad_fn=<MseLossBackward>)
output :  tensor([[138496.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1774e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147974.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(681863.0625, grad_fn=<MseLossBackward>)
output :  tensor([[186057.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3773670.5000, grad_fn=<MseLossBackward>)
output :  tensor([[173423.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(19565278., grad_fn=<MseLossBackward>)
output :  tensor([[180261.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(68153.6250, grad_fn=<MseLossBackward>)
output :  tensor([[218354.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2708133., grad_fn=<MseLossBackward>)
output :  tensor([[111495.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(12929025., grad_fn=<MseLossBackward>)
output :  tensor([[136849.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4279e+08, grad_fn=<MseLossBackward>)
output :  tensor([[287399.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1959912.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117179.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(1391349.2500, grad_fn=<MseLossBackward>)
output :  tensor([[178643.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7104e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185866.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(750307.8750, grad_fn=<MseLossBackward>)
output :  tensor([[187801.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5298772.5000, grad_fn=<MseLossBackward>)
output :  tensor([[251469.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5371e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220662.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1788655.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128807.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2474e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173072.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0291e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125028.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1057201.6250, grad_fn=<MseLossBackward>)
output :  tensor([[184273.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4774e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151895.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1220990.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153789.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(53136584., grad_fn=<MseLossBackward>)
output :  tensor([[204745.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2416421.7500, grad_fn=<MseLossBackward>)
output :  tensor([[145141.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5980e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174839.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1345672.5000, grad_fn=<MseLossBackward>)
output :  tensor([[252692.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1865e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147848.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(22810.4375, grad_fn=<MseLossBackward>)
output :  tensor([[203028.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(132223.1406, grad_fn=<MseLossBackward>)
output :  tensor([[162277.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(5417765.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127305.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5449e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139972.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(17828318., grad_fn=<MseLossBackward>)
output :  tensor([[184023.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(567.7795, grad_fn=<MseLossBackward>)
output :  tensor([[196117.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(37421896., grad_fn=<MseLossBackward>)
output :  tensor([[230427.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4307e+09, grad_fn=<MseLossBackward>)
output :  tensor([[254197.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7853218., grad_fn=<MseLossBackward>)
output :  tensor([[186616.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7525e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144566.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8160e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142659.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3386520., grad_fn=<MseLossBackward>)
output :  tensor([[71972.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0223e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133014.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3940845.2500, grad_fn=<MseLossBackward>)
output :  tensor([[131424.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6372311.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153822.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(31367.7305, grad_fn=<MseLossBackward>)
output :  tensor([[127303.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(92240.3359, grad_fn=<MseLossBackward>)
output :  tensor([[77233.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(538733.0625, grad_fn=<MseLossBackward>)
output :  tensor([[82806.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(650442.2500, grad_fn=<MseLossBackward>)
output :  tensor([[231164.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(698869.8750, grad_fn=<MseLossBackward>)
output :  tensor([[140504.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8425e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127672.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(7996921., grad_fn=<MseLossBackward>)
output :  tensor([[171341.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(18852422., grad_fn=<MseLossBackward>)
output :  tensor([[233662.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1788864.5000, grad_fn=<MseLossBackward>)
output :  tensor([[190570.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2462692.7500, grad_fn=<MseLossBackward>)
output :  tensor([[159101.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9620659., grad_fn=<MseLossBackward>)
output :  tensor([[197964.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4124.0479, grad_fn=<MseLossBackward>)
output :  tensor([[201155.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2849e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137895.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(802256.1250, grad_fn=<MseLossBackward>)
output :  tensor([[154915.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7217.0332, grad_fn=<MseLossBackward>)
output :  tensor([[134376.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2636209., grad_fn=<MseLossBackward>)
output :  tensor([[198746.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7681e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156367.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5602911., grad_fn=<MseLossBackward>)
output :  tensor([[137258.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9148e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146597.]], grad_fn=<AddmmBackward>)
loss:  tensor(2879809., grad_fn=<MseLossBackward>)
output :  tensor([[210701.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1685371.8750, grad_fn=<MseLossBackward>)
output :  tensor([[101234.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6996e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168282.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(611890.6250, grad_fn=<MseLossBackward>)
output :  tensor([[125757.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5029016.5000, grad_fn=<MseLossBackward>)
output :  tensor([[148095.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1200770.7500, grad_fn=<MseLossBackward>)
output :  tensor([[103521.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6924e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137672.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(29594.7500, grad_fn=<MseLossBackward>)
output :  tensor([[234623.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1894752.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143207.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3214344.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138743.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1547069.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166145.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4551e+09, grad_fn=<MseLossBackward>)
output :  tensor([[267012.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2072e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176951.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3810060., grad_fn=<MseLossBackward>)
output :  tensor([[105982.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(10281091., grad_fn=<MseLossBackward>)
output :  tensor([[202767.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5850e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161481.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6158695.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162814.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6058e+10, grad_fn=<MseLossBackward>)
output :  tensor([[100839.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(6450806.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122377.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(1493723.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156307.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(94383.3594, grad_fn=<MseLossBackward>)
output :  tensor([[142106.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4437276.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202347.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5511343., grad_fn=<MseLossBackward>)
output :  tensor([[140621.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1900090., grad_fn=<MseLossBackward>)
output :  tensor([[260909.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1878869.8750, grad_fn=<MseLossBackward>)
output :  tensor([[128362.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2505e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166464.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(930380.8125, grad_fn=<MseLossBackward>)
output :  tensor([[190500.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4000687.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126557.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7414e+08, grad_fn=<MseLossBackward>)
output :  tensor([[261964.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4315e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156411.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3568e+08, grad_fn=<MseLossBackward>)
output :  tensor([[242559.]], grad_fn=<AddmmBackward>)
loss:  tensor(7789681., grad_fn=<MseLossBackward>)
output :  tensor([[145919.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3683520.5000, grad_fn=<MseLossBackward>)
output :  tensor([[212133.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4551089., grad_fn=<MseLossBackward>)
output :  tensor([[177161.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(22667568., grad_fn=<MseLossBackward>)
output :  tensor([[151501.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6242814.5000, grad_fn=<MseLossBackward>)
output :  tensor([[118293.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(86009.3125, grad_fn=<MseLossBackward>)
output :  tensor([[234390.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7773e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239255.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(554699.1250, grad_fn=<MseLossBackward>)
output :  tensor([[153446.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(12069.0820, grad_fn=<MseLossBackward>)
output :  tensor([[253116.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3181931.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123672.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(84059528., grad_fn=<MseLossBackward>)
output :  tensor([[176104.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(10959.4727, grad_fn=<MseLossBackward>)
output :  tensor([[160329.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(108724.7578, grad_fn=<MseLossBackward>)
output :  tensor([[137405.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(41026228., grad_fn=<MseLossBackward>)
output :  tensor([[193676.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1186e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163935.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4188.5166, grad_fn=<MseLossBackward>)
output :  tensor([[164450.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2102817.2500, grad_fn=<MseLossBackward>)
output :  tensor([[157620.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(144020.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142815.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(50184164., grad_fn=<MseLossBackward>)
output :  tensor([[173326.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0739e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162253.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5078825.5000, grad_fn=<MseLossBackward>)
output :  tensor([[377150.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(46507712., grad_fn=<MseLossBackward>)
output :  tensor([[130845.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(14784205., grad_fn=<MseLossBackward>)
output :  tensor([[127912.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7988e+09, grad_fn=<MseLossBackward>)
output :  tensor([[282308.]], grad_fn=<AddmmBackward>)
loss:  tensor(1199025., grad_fn=<MseLossBackward>)
output :  tensor([[159166.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8030139., grad_fn=<MseLossBackward>)
output :  tensor([[133918.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8004e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227195.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(23083520., grad_fn=<MseLossBackward>)
output :  tensor([[178816.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2833172.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153897.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3600565.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144118.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(776601.5625, grad_fn=<MseLossBackward>)
output :  tensor([[154856.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2245e+08, grad_fn=<MseLossBackward>)
output :  tensor([[98312.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2846285.2500, grad_fn=<MseLossBackward>)
output :  tensor([[77316.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9987e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166236.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1529164.1250, grad_fn=<MseLossBackward>)
output :  tensor([[188200.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5840e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158158.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(25241.2656, grad_fn=<MseLossBackward>)
output :  tensor([[156761.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(546051.7500, grad_fn=<MseLossBackward>)
output :  tensor([[134448.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(9006095., grad_fn=<MseLossBackward>)
output :  tensor([[207150.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1441838.1250, grad_fn=<MseLossBackward>)
output :  tensor([[137793.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(42539.0625, grad_fn=<MseLossBackward>)
output :  tensor([[184074.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5857e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146669.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(448481.3438, grad_fn=<MseLossBackward>)
output :  tensor([[109833.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2005e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93118.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(777910.2500, grad_fn=<MseLossBackward>)
output :  tensor([[173922.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1161039.8750, grad_fn=<MseLossBackward>)
output :  tensor([[262821.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5863359.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138881.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6855642., grad_fn=<MseLossBackward>)
output :  tensor([[159692.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(40867.1484, grad_fn=<MseLossBackward>)
output :  tensor([[133802.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1696669.1250, grad_fn=<MseLossBackward>)
output :  tensor([[147644.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3443576., grad_fn=<MseLossBackward>)
output :  tensor([[168831.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(867430.3125, grad_fn=<MseLossBackward>)
output :  tensor([[126788.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(44695.9062, grad_fn=<MseLossBackward>)
output :  tensor([[173409.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0712e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157504.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(254205.0312, grad_fn=<MseLossBackward>)
output :  tensor([[119134.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6942072., grad_fn=<MseLossBackward>)
output :  tensor([[161187.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1571e+09, grad_fn=<MseLossBackward>)
output :  tensor([[53100.3555]], grad_fn=<AddmmBackward>)
loss:  tensor(1210782.1250, grad_fn=<MseLossBackward>)
output :  tensor([[233412.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2548e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199696.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1699804.7500, grad_fn=<MseLossBackward>)
output :  tensor([[184558.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(195336.3750, grad_fn=<MseLossBackward>)
output :  tensor([[108726.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(7433546.5000, grad_fn=<MseLossBackward>)
output :  tensor([[85598.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1963238.8750, grad_fn=<MseLossBackward>)
output :  tensor([[141734.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3008381.7500, grad_fn=<MseLossBackward>)
output :  tensor([[221427.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2667e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205294.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4864644., grad_fn=<MseLossBackward>)
output :  tensor([[169537.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(20586922., grad_fn=<MseLossBackward>)
output :  tensor([[173298.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4093e+09, grad_fn=<MseLossBackward>)
output :  tensor([[187248.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7572902., grad_fn=<MseLossBackward>)
output :  tensor([[87574.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(329664.3750, grad_fn=<MseLossBackward>)
output :  tensor([[138719.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1639920.3750, grad_fn=<MseLossBackward>)
output :  tensor([[106981.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(12381492., grad_fn=<MseLossBackward>)
output :  tensor([[148269.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5153e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173541.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8098e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195715.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(86201944., grad_fn=<MseLossBackward>)
output :  tensor([[179003.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(992420.6875, grad_fn=<MseLossBackward>)
output :  tensor([[98808.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5327513., grad_fn=<MseLossBackward>)
output :  tensor([[117915.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(173049.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162540.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6052e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198333.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2776285., grad_fn=<MseLossBackward>)
output :  tensor([[143653.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(119975.6406, grad_fn=<MseLossBackward>)
train_loss: [2.6042076e+09]
epoch_result tensor([0.])
output :  tensor([[158269.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(52907.1875, grad_fn=<MseLossBackward>)
output :  tensor([[123857.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3449145.5000, grad_fn=<MseLossBackward>)
output :  tensor([[195258.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1118603.7500, grad_fn=<MseLossBackward>)
output :  tensor([[178211.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1468868.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153487.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0084e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129852.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3432277.2500, grad_fn=<MseLossBackward>)
output :  tensor([[141297.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(88357.5625, grad_fn=<MseLossBackward>)
output :  tensor([[119100.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(10189.9561, grad_fn=<MseLossBackward>)
output :  tensor([[68154.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(93207408., grad_fn=<MseLossBackward>)
output :  tensor([[167151.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1326024.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153706.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8785e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226997.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3989507., grad_fn=<MseLossBackward>)
output :  tensor([[168316.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(466787.8750, grad_fn=<MseLossBackward>)
output :  tensor([[247710.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3958421., grad_fn=<MseLossBackward>)
output :  tensor([[56183.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1401671., grad_fn=<MseLossBackward>)
output :  tensor([[161960.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0487e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166461.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(72902784., grad_fn=<MseLossBackward>)
output :  tensor([[167857.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2900e+08, grad_fn=<MseLossBackward>)
output :  tensor([[275727.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(528665.3125, grad_fn=<MseLossBackward>)
output :  tensor([[194906.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4382611.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140621.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3918e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194754.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(766363.4375, grad_fn=<MseLossBackward>)
output :  tensor([[180926.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9336e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151975.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(952515., grad_fn=<MseLossBackward>)
output :  tensor([[166382.]], grad_fn=<AddmmBackward>)
loss:  tensor(13089924., grad_fn=<MseLossBackward>)
output :  tensor([[85793.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(154916.0469, grad_fn=<MseLossBackward>)
output :  tensor([[170409.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2959e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185981.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(962759.5625, grad_fn=<MseLossBackward>)
output :  tensor([[205364.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5136e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110674.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(454760.5625, grad_fn=<MseLossBackward>)
output :  tensor([[170066.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(871305.5625, grad_fn=<MseLossBackward>)
output :  tensor([[138524.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4098220.7500, grad_fn=<MseLossBackward>)
output :  tensor([[129484.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(234679.6875, grad_fn=<MseLossBackward>)
output :  tensor([[122032.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(6411222., grad_fn=<MseLossBackward>)
output :  tensor([[146924.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9548e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167546.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1742e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151202.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2256661.2500, grad_fn=<MseLossBackward>)
output :  tensor([[182324.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5402792., grad_fn=<MseLossBackward>)
output :  tensor([[138237.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7631579., grad_fn=<MseLossBackward>)
output :  tensor([[104081.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9828e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134223.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5249e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136290.]], grad_fn=<AddmmBackward>)
loss:  tensor(1664100., grad_fn=<MseLossBackward>)
output :  tensor([[138520.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3272e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221056.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(15547865., grad_fn=<MseLossBackward>)
output :  tensor([[132343.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(8660.6289, grad_fn=<MseLossBackward>)
output :  tensor([[150782.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3177027.7500, grad_fn=<MseLossBackward>)
output :  tensor([[109775.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(4947670.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160841.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(707806.7500, grad_fn=<MseLossBackward>)
output :  tensor([[145066.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4933e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193751.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3067533.2500, grad_fn=<MseLossBackward>)
output :  tensor([[135311.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(742936.2500, grad_fn=<MseLossBackward>)
output :  tensor([[115826.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(33947920., grad_fn=<MseLossBackward>)
output :  tensor([[228034.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(35584580., grad_fn=<MseLossBackward>)
output :  tensor([[164305.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4191e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153913.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(25873754., grad_fn=<MseLossBackward>)
output :  tensor([[202352.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8950e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243880.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2126e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145897.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5745983.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135437.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2065238.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157412.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5818121., grad_fn=<MseLossBackward>)
output :  tensor([[133782.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(14304706., grad_fn=<MseLossBackward>)
output :  tensor([[181076.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2289e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180712.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(11477379., grad_fn=<MseLossBackward>)
output :  tensor([[160706.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(630039.0625, grad_fn=<MseLossBackward>)
output :  tensor([[138366.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(21465558., grad_fn=<MseLossBackward>)
output :  tensor([[144083.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2508957., grad_fn=<MseLossBackward>)
output :  tensor([[149782.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(22868868., grad_fn=<MseLossBackward>)
output :  tensor([[172323.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5377e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193441.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5500e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136697.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(38858.2656, grad_fn=<MseLossBackward>)
output :  tensor([[175164.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(10657368., grad_fn=<MseLossBackward>)
output :  tensor([[175557.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(29621316., grad_fn=<MseLossBackward>)
output :  tensor([[114133.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(750497.3750, grad_fn=<MseLossBackward>)
output :  tensor([[216357.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(21549904., grad_fn=<MseLossBackward>)
output :  tensor([[180108.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(11502802., grad_fn=<MseLossBackward>)
output :  tensor([[126421.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(849939.9375, grad_fn=<MseLossBackward>)
output :  tensor([[195384.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1245386.2500, grad_fn=<MseLossBackward>)
output :  tensor([[178218.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(11013376., grad_fn=<MseLossBackward>)
output :  tensor([[208939.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1439e+10, grad_fn=<MseLossBackward>)
output :  tensor([[207668.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(11097227., grad_fn=<MseLossBackward>)
output :  tensor([[165903.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2183e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193408.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1190656., grad_fn=<MseLossBackward>)
output :  tensor([[110970.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(4119980.2500, grad_fn=<MseLossBackward>)
output :  tensor([[114492.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(3969589.2500, grad_fn=<MseLossBackward>)
output :  tensor([[112648.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(421079.3125, grad_fn=<MseLossBackward>)
output :  tensor([[148031.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1517169.6250, grad_fn=<MseLossBackward>)
output :  tensor([[158729.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3824e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180063.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4064.0625, grad_fn=<MseLossBackward>)
output :  tensor([[126249.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(1563652.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144247.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(566867.8125, grad_fn=<MseLossBackward>)
output :  tensor([[181669.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1874e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119077.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4742050.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191905.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(25951702., grad_fn=<MseLossBackward>)
output :  tensor([[144722.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(77179.7812, grad_fn=<MseLossBackward>)
output :  tensor([[218013.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(26152676., grad_fn=<MseLossBackward>)
output :  tensor([[126256.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(65604.0156, grad_fn=<MseLossBackward>)
output :  tensor([[248387.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3568.1956, grad_fn=<MseLossBackward>)
output :  tensor([[239885.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0353e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153162.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7359e+08, grad_fn=<MseLossBackward>)
output :  tensor([[86140.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3204e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194097.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5290e+09, grad_fn=<MseLossBackward>)
output :  tensor([[83806.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(7876354.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138422.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1161208.2500, grad_fn=<MseLossBackward>)
output :  tensor([[76937.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2066046.8750, grad_fn=<MseLossBackward>)
output :  tensor([[143764.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(658278.6875, grad_fn=<MseLossBackward>)
output :  tensor([[174833.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1361670.2500, grad_fn=<MseLossBackward>)
output :  tensor([[152275.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1499515., grad_fn=<MseLossBackward>)
output :  tensor([[107286.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(12910.6406, grad_fn=<MseLossBackward>)
output :  tensor([[202902.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2735e+10, grad_fn=<MseLossBackward>)
output :  tensor([[129542.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(1086920.2500, grad_fn=<MseLossBackward>)
output :  tensor([[266217.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8995e+08, grad_fn=<MseLossBackward>)
output :  tensor([[300234.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(95357056., grad_fn=<MseLossBackward>)
output :  tensor([[107008.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(241142.3750, grad_fn=<MseLossBackward>)
output :  tensor([[172025.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(225283.7188, grad_fn=<MseLossBackward>)
output :  tensor([[132707.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1045e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145849.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(46914152., grad_fn=<MseLossBackward>)
output :  tensor([[130076.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(30002.0293, grad_fn=<MseLossBackward>)
output :  tensor([[126245.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(1551912.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137435.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8042e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226413.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8646e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188512.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3252e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141564.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5454341.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123745.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(14098969., grad_fn=<MseLossBackward>)
output :  tensor([[114723.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(12064388., grad_fn=<MseLossBackward>)
output :  tensor([[253459.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1734e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135473.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(223935.9844, grad_fn=<MseLossBackward>)
output :  tensor([[206201.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(10246601., grad_fn=<MseLossBackward>)
output :  tensor([[107832.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(8600793., grad_fn=<MseLossBackward>)
output :  tensor([[139491.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(210150.6094, grad_fn=<MseLossBackward>)
output :  tensor([[209232.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3310e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183304.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(11589344., grad_fn=<MseLossBackward>)
output :  tensor([[185376.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(141728.7188, grad_fn=<MseLossBackward>)
output :  tensor([[164622.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0845e+10, grad_fn=<MseLossBackward>)
output :  tensor([[296235.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5027e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195517.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5677646.5000, grad_fn=<MseLossBackward>)
output :  tensor([[261159.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0079e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222595.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8839e+09, grad_fn=<MseLossBackward>)
output :  tensor([[283422.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1275e+09, grad_fn=<MseLossBackward>)
output :  tensor([[225165.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1358827.3750, grad_fn=<MseLossBackward>)
output :  tensor([[223478.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8399e+10, grad_fn=<MseLossBackward>)
output :  tensor([[198018.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1037915.2500, grad_fn=<MseLossBackward>)
output :  tensor([[157936.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3732e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131957.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(294424.9375, grad_fn=<MseLossBackward>)
output :  tensor([[131622.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(15035249., grad_fn=<MseLossBackward>)
output :  tensor([[92995.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3983641.7500, grad_fn=<MseLossBackward>)
output :  tensor([[108161.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(26014.1621, grad_fn=<MseLossBackward>)
output :  tensor([[274505.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9588e+09, grad_fn=<MseLossBackward>)
output :  tensor([[234646.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(125304.9375, grad_fn=<MseLossBackward>)
output :  tensor([[146231.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1516707.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135810.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2855255., grad_fn=<MseLossBackward>)
output :  tensor([[174201.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(219814.4688, grad_fn=<MseLossBackward>)
output :  tensor([[144603.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(417901.6562, grad_fn=<MseLossBackward>)
output :  tensor([[166952.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5888e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168644.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(13284316., grad_fn=<MseLossBackward>)
output :  tensor([[136732.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(71673.3281, grad_fn=<MseLossBackward>)
output :  tensor([[187940.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2824e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111846.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(23651.0762, grad_fn=<MseLossBackward>)
output :  tensor([[170190.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3275025.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121425.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2032896.7500, grad_fn=<MseLossBackward>)
output :  tensor([[86620.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(143919.4688, grad_fn=<MseLossBackward>)
output :  tensor([[179488.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(261280.7188, grad_fn=<MseLossBackward>)
output :  tensor([[108589.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(1717062.1250, grad_fn=<MseLossBackward>)
output :  tensor([[240877.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3524889., grad_fn=<MseLossBackward>)
output :  tensor([[246343.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1805706., grad_fn=<MseLossBackward>)
output :  tensor([[132167.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7114972.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109617.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(433385.6250, grad_fn=<MseLossBackward>)
output :  tensor([[291037.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1350e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170788.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(506810.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126229.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1512285., grad_fn=<MseLossBackward>)
output :  tensor([[146722.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2496e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203108.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1863e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140493.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(256178.3281, grad_fn=<MseLossBackward>)
output :  tensor([[157006.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5127e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157048.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(9911675., grad_fn=<MseLossBackward>)
output :  tensor([[127481.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(4073364.5000, grad_fn=<MseLossBackward>)
output :  tensor([[245960.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7567e+10, grad_fn=<MseLossBackward>)
output :  tensor([[400747.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1568991.1250, grad_fn=<MseLossBackward>)
output :  tensor([[116570.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(57306436., grad_fn=<MseLossBackward>)
output :  tensor([[123681.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(26848266., grad_fn=<MseLossBackward>)
output :  tensor([[157675.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3329199.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129207.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1469e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163421.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4314e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172062.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8517e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103118.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(232045.4219, grad_fn=<MseLossBackward>)
output :  tensor([[140597.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(162169.8125, grad_fn=<MseLossBackward>)
output :  tensor([[366836.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(209592.2812, grad_fn=<MseLossBackward>)
output :  tensor([[205467.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3554e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173149.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5525952., grad_fn=<MseLossBackward>)
output :  tensor([[204947.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4191552.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138466.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(284338.9062, grad_fn=<MseLossBackward>)
output :  tensor([[193488.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1023764.5625, grad_fn=<MseLossBackward>)
output :  tensor([[135394.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7812e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177596.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(11583068., grad_fn=<MseLossBackward>)
output :  tensor([[242525.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(276413.0625, grad_fn=<MseLossBackward>)
output :  tensor([[180220.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(38700648., grad_fn=<MseLossBackward>)
output :  tensor([[109433.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2054563.8750, grad_fn=<MseLossBackward>)
output :  tensor([[263628.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(870255.7500, grad_fn=<MseLossBackward>)
output :  tensor([[251056.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1116489.3750, grad_fn=<MseLossBackward>)
output :  tensor([[119285.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(13798671., grad_fn=<MseLossBackward>)
output :  tensor([[217139.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3479e+09, grad_fn=<MseLossBackward>)
output :  tensor([[303576.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7193e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202713.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(18371672., grad_fn=<MseLossBackward>)
output :  tensor([[214812.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5672e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159359.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2129456.2500, grad_fn=<MseLossBackward>)
output :  tensor([[171544.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2417684.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161199.]], grad_fn=<AddmmBackward>)
loss:  tensor(18207288., grad_fn=<MseLossBackward>)
output :  tensor([[166124.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(15017199., grad_fn=<MseLossBackward>)
output :  tensor([[237622.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2276e+08, grad_fn=<MseLossBackward>)
output :  tensor([[218923.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1093e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160568.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8411e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124698.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2885698.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178405.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1974947.1250, grad_fn=<MseLossBackward>)
output :  tensor([[181394.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1789e+09, grad_fn=<MseLossBackward>)
output :  tensor([[209563.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4245e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134665.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(54734.0664, grad_fn=<MseLossBackward>)
output :  tensor([[149485.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7760e+08, grad_fn=<MseLossBackward>)
output :  tensor([[279167.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4696024.5000, grad_fn=<MseLossBackward>)
output :  tensor([[86366.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(1867044.7500, grad_fn=<MseLossBackward>)
output :  tensor([[235065.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2056580.1250, grad_fn=<MseLossBackward>)
output :  tensor([[264022.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0170e+11, grad_fn=<MseLossBackward>)
output :  tensor([[169462.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(289376.7500, grad_fn=<MseLossBackward>)
output :  tensor([[195227.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5819e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155124.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(15441.9453, grad_fn=<MseLossBackward>)
output :  tensor([[205963.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1006e+09, grad_fn=<MseLossBackward>)
output :  tensor([[126902.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4399637.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150488.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(30118658., grad_fn=<MseLossBackward>)
output :  tensor([[169391.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2316e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188320.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6104451., grad_fn=<MseLossBackward>)
output :  tensor([[124896.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(1217143.3750, grad_fn=<MseLossBackward>)
output :  tensor([[139029.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6397580., grad_fn=<MseLossBackward>)
output :  tensor([[179415.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(41158240., grad_fn=<MseLossBackward>)
output :  tensor([[197340.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7730e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238793.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(17696482., grad_fn=<MseLossBackward>)
output :  tensor([[154422.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(333127.3750, grad_fn=<MseLossBackward>)
output :  tensor([[198233.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4987964., grad_fn=<MseLossBackward>)
output :  tensor([[165239.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5113e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185227.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(32808016., grad_fn=<MseLossBackward>)
output :  tensor([[181893.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3973232.5000, grad_fn=<MseLossBackward>)
output :  tensor([[99509.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6296806., grad_fn=<MseLossBackward>)
output :  tensor([[171360.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1803e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136436.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2064430.1250, grad_fn=<MseLossBackward>)
output :  tensor([[124565.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(91507760., grad_fn=<MseLossBackward>)
output :  tensor([[172509.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2221636.7500, grad_fn=<MseLossBackward>)
output :  tensor([[91326.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(40021044., grad_fn=<MseLossBackward>)
output :  tensor([[288075.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3702016.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166312.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1721631., grad_fn=<MseLossBackward>)
output :  tensor([[190258.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0423e+10, grad_fn=<MseLossBackward>)
output :  tensor([[248177.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2085e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147594.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(11598069., grad_fn=<MseLossBackward>)
output :  tensor([[122680.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(1740977.1250, grad_fn=<MseLossBackward>)
output :  tensor([[113144.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(45631608., grad_fn=<MseLossBackward>)
output :  tensor([[146320.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8095e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175899.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3606616.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110818.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0192e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209260.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1824e+10, grad_fn=<MseLossBackward>)
output :  tensor([[227796.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8779e+08, grad_fn=<MseLossBackward>)
output :  tensor([[250965.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0801e+10, grad_fn=<MseLossBackward>)
output :  tensor([[219888.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6524e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194732.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4585e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188756.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1578753., grad_fn=<MseLossBackward>)
output :  tensor([[208186.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6952e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190888.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1057e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180156.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2006162.3750, grad_fn=<MseLossBackward>)
output :  tensor([[149190.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(7892939., grad_fn=<MseLossBackward>)
output :  tensor([[335364.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2675473.5000, grad_fn=<MseLossBackward>)
output :  tensor([[210448.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2407103.7500, grad_fn=<MseLossBackward>)
output :  tensor([[158333.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2776857.7500, grad_fn=<MseLossBackward>)
output :  tensor([[187195.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9489e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109178.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(17461690., grad_fn=<MseLossBackward>)
output :  tensor([[272434.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9843e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170841.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9353084., grad_fn=<MseLossBackward>)
output :  tensor([[214925.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2032362.1250, grad_fn=<MseLossBackward>)
output :  tensor([[210055.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1979e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180068.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(754210.8125, grad_fn=<MseLossBackward>)
output :  tensor([[203103.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1700130.7500, grad_fn=<MseLossBackward>)
output :  tensor([[154644.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(126369.1406, grad_fn=<MseLossBackward>)
output :  tensor([[150196.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5197e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120609.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4449924.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140573.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(329332.5000, grad_fn=<MseLossBackward>)
output :  tensor([[148300.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(489278.4062, grad_fn=<MseLossBackward>)
output :  tensor([[199710.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6458e+10, grad_fn=<MseLossBackward>)
output :  tensor([[163218.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(13824570., grad_fn=<MseLossBackward>)
output :  tensor([[102138.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6961352.5000, grad_fn=<MseLossBackward>)
output :  tensor([[225149.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2053e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187198.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7081e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177575.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1188645., grad_fn=<MseLossBackward>)
output :  tensor([[81710.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(84095.4688, grad_fn=<MseLossBackward>)
output :  tensor([[129524.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(1049776.3750, grad_fn=<MseLossBackward>)
output :  tensor([[211391.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6804761.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144559.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(312865.4375, grad_fn=<MseLossBackward>)
output :  tensor([[132933.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(8604689., grad_fn=<MseLossBackward>)
output :  tensor([[149054.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(41664200., grad_fn=<MseLossBackward>)
output :  tensor([[175493.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4435e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143606.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(154793.0625, grad_fn=<MseLossBackward>)
output :  tensor([[161553.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2413653.5000, grad_fn=<MseLossBackward>)
output :  tensor([[213014.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3943761.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135371.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2244e+08, grad_fn=<MseLossBackward>)
output :  tensor([[255591.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(349779.8438, grad_fn=<MseLossBackward>)
output :  tensor([[158785.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(510019.1562, grad_fn=<MseLossBackward>)
output :  tensor([[128558.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3396.7041, grad_fn=<MseLossBackward>)
output :  tensor([[95768.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(590124.0625, grad_fn=<MseLossBackward>)
output :  tensor([[153149.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7128e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175875.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(16194462., grad_fn=<MseLossBackward>)
output :  tensor([[119618.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(777193.7500, grad_fn=<MseLossBackward>)
output :  tensor([[188961.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5990e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142931.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0236e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150602.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(493923.4375, grad_fn=<MseLossBackward>)
output :  tensor([[185460.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5239664., grad_fn=<MseLossBackward>)
output :  tensor([[253595.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5588e+09, grad_fn=<MseLossBackward>)
output :  tensor([[88688.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(7906245.5000, grad_fn=<MseLossBackward>)
output :  tensor([[236567.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(11779482., grad_fn=<MseLossBackward>)
output :  tensor([[131178.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(7174697., grad_fn=<MseLossBackward>)
output :  tensor([[165029.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0175e+10, grad_fn=<MseLossBackward>)
output :  tensor([[111672.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3624e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173491.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6292572., grad_fn=<MseLossBackward>)
output :  tensor([[163722.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9160e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154648.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8314e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238318.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(464399.6562, grad_fn=<MseLossBackward>)
output :  tensor([[221807.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3099e+09, grad_fn=<MseLossBackward>)
output :  tensor([[125203.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(3225644., grad_fn=<MseLossBackward>)
output :  tensor([[127943.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3777799.5000, grad_fn=<MseLossBackward>)
output :  tensor([[225623.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1893806., grad_fn=<MseLossBackward>)
output :  tensor([[230416.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(12844384., grad_fn=<MseLossBackward>)
output :  tensor([[228363.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2767804., grad_fn=<MseLossBackward>)
output :  tensor([[146689.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1717287.3750, grad_fn=<MseLossBackward>)
output :  tensor([[215576.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(31097352., grad_fn=<MseLossBackward>)
output :  tensor([[131719.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3735e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133842.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1801383.3750, grad_fn=<MseLossBackward>)
output :  tensor([[309752.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(27540848., grad_fn=<MseLossBackward>)
output :  tensor([[140259.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(548618., grad_fn=<MseLossBackward>)
output :  tensor([[120700.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8838e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106819.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7182651.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153503.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6085e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179122.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1399e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171456.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2383550., grad_fn=<MseLossBackward>)
output :  tensor([[191368.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(92767296., grad_fn=<MseLossBackward>)
output :  tensor([[102420.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5859879.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180535.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2358576., grad_fn=<MseLossBackward>)
output :  tensor([[170200.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5293019., grad_fn=<MseLossBackward>)
output :  tensor([[138508.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(241848.7969, grad_fn=<MseLossBackward>)
output :  tensor([[260095.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8020e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141616.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2054e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175725.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(7426476.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141546.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2390695.7500, grad_fn=<MseLossBackward>)
output :  tensor([[199314.]], grad_fn=<AddmmBackward>)
loss:  tensor(1406596., grad_fn=<MseLossBackward>)
output :  tensor([[169191.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(652914.5000, grad_fn=<MseLossBackward>)
output :  tensor([[243966.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1145.3994, grad_fn=<MseLossBackward>)
output :  tensor([[132238.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5114099.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151168.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3306942.2500, grad_fn=<MseLossBackward>)
output :  tensor([[213382.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2615396.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162986.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4054874.5000, grad_fn=<MseLossBackward>)
output :  tensor([[195378.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(40683868., grad_fn=<MseLossBackward>)
output :  tensor([[134828.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8424e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129748.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(559971.6250, grad_fn=<MseLossBackward>)
output :  tensor([[138727.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1619972.1250, grad_fn=<MseLossBackward>)
output :  tensor([[199976.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8336e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165588.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5592e+09, grad_fn=<MseLossBackward>)
output :  tensor([[76858.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8422e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94352.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(97070680., grad_fn=<MseLossBackward>)
output :  tensor([[260210.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(47847700., grad_fn=<MseLossBackward>)
output :  tensor([[204589.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3020e+09, grad_fn=<MseLossBackward>)
output :  tensor([[112453.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6486174.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159958.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5855e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207303.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6120e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179821.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1321e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159183.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(17504026., grad_fn=<MseLossBackward>)
output :  tensor([[170079.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6397.5000, grad_fn=<MseLossBackward>)
output :  tensor([[118285.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(10793843., grad_fn=<MseLossBackward>)
output :  tensor([[159688.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(21981740., grad_fn=<MseLossBackward>)
output :  tensor([[192926.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9527e+08, grad_fn=<MseLossBackward>)
output :  tensor([[217114.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5690759.5000, grad_fn=<MseLossBackward>)
output :  tensor([[245484.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4952e+11, grad_fn=<MseLossBackward>)
output :  tensor([[148579.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2495659.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110357.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(3524566.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170800.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2320e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156368.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(34443512., grad_fn=<MseLossBackward>)
output :  tensor([[234012.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(8923569., grad_fn=<MseLossBackward>)
output :  tensor([[115513.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(263217.0938, grad_fn=<MseLossBackward>)
output :  tensor([[180921.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3916255.5000, grad_fn=<MseLossBackward>)
output :  tensor([[185912.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(619861., grad_fn=<MseLossBackward>)
output :  tensor([[164637.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4137e+10, grad_fn=<MseLossBackward>)
output :  tensor([[96471.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3935e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239775.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(600843., grad_fn=<MseLossBackward>)
output :  tensor([[178221.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4936728.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142178.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4745726., grad_fn=<MseLossBackward>)
output :  tensor([[235983.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(967764.0625, grad_fn=<MseLossBackward>)
output :  tensor([[163428.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(183652.4219, grad_fn=<MseLossBackward>)
output :  tensor([[204584.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4500e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134869.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(17058.8086, grad_fn=<MseLossBackward>)
output :  tensor([[186871.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1858e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135152.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(718203.3125, grad_fn=<MseLossBackward>)
output :  tensor([[229558.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(41496748., grad_fn=<MseLossBackward>)
output :  tensor([[227076.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2549e+08, grad_fn=<MseLossBackward>)
output :  tensor([[90221.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(48906.6328, grad_fn=<MseLossBackward>)
output :  tensor([[161689.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5085166., grad_fn=<MseLossBackward>)
output :  tensor([[245769.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5652e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146001.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1002220., grad_fn=<MseLossBackward>)
output :  tensor([[108692.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7383e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163926.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(328956.0312, grad_fn=<MseLossBackward>)
output :  tensor([[145287.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1657736.7500, grad_fn=<MseLossBackward>)
output :  tensor([[126795.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1973366.5000, grad_fn=<MseLossBackward>)
output :  tensor([[188555.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9624e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123876.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1895956.8750, grad_fn=<MseLossBackward>)
output :  tensor([[150471.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2336933.2500, grad_fn=<MseLossBackward>)
output :  tensor([[167724.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(16207795., grad_fn=<MseLossBackward>)
output :  tensor([[150344.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(429823.6562, grad_fn=<MseLossBackward>)
output :  tensor([[163774.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(764777.5625, grad_fn=<MseLossBackward>)
output :  tensor([[136993.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8366e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135161.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(9994489., grad_fn=<MseLossBackward>)
output :  tensor([[154546.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4168e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144700.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(301246.6250, grad_fn=<MseLossBackward>)
output :  tensor([[163641.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3576412.7500, grad_fn=<MseLossBackward>)
output :  tensor([[137117.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4079e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149614.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(663410.2500, grad_fn=<MseLossBackward>)
output :  tensor([[185935.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4262870., grad_fn=<MseLossBackward>)
output :  tensor([[165900.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9608450., grad_fn=<MseLossBackward>)
output :  tensor([[180947.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(897460.1875, grad_fn=<MseLossBackward>)
output :  tensor([[221199.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1438987.6250, grad_fn=<MseLossBackward>)
output :  tensor([[109126.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1504877.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139169.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0361e+08, grad_fn=<MseLossBackward>)
output :  tensor([[279861.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(37683484., grad_fn=<MseLossBackward>)
output :  tensor([[119288.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(10814078., grad_fn=<MseLossBackward>)
output :  tensor([[176190.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9193e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181880.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(9729038., grad_fn=<MseLossBackward>)
output :  tensor([[174380.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2363e+08, grad_fn=<MseLossBackward>)
output :  tensor([[253302.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7078e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224061.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4251264., grad_fn=<MseLossBackward>)
output :  tensor([[127600.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7093e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175239.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9458e+08, grad_fn=<MseLossBackward>)
output :  tensor([[121002.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8986505., grad_fn=<MseLossBackward>)
output :  tensor([[184401.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4709e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151038.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3847850., grad_fn=<MseLossBackward>)
output :  tensor([[152996.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(42210400., grad_fn=<MseLossBackward>)
output :  tensor([[203581.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7390242., grad_fn=<MseLossBackward>)
output :  tensor([[145021.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5678e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175528.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(222621.7812, grad_fn=<MseLossBackward>)
output :  tensor([[250652.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3217e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149144.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1310237.8750, grad_fn=<MseLossBackward>)
output :  tensor([[199304.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(11295901., grad_fn=<MseLossBackward>)
output :  tensor([[159826.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(15163.6133, grad_fn=<MseLossBackward>)
output :  tensor([[124218.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3118e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133979.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3135279., grad_fn=<MseLossBackward>)
output :  tensor([[179694.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(18535984., grad_fn=<MseLossBackward>)
output :  tensor([[197623.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(58114416., grad_fn=<MseLossBackward>)
output :  tensor([[230725.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3959e+09, grad_fn=<MseLossBackward>)
output :  tensor([[256676.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(104399.6719, grad_fn=<MseLossBackward>)
output :  tensor([[186510.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7553e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144586.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8182e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143327.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1375159.3750, grad_fn=<MseLossBackward>)
output :  tensor([[72074.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0288e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141786.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(46056584., grad_fn=<MseLossBackward>)
output :  tensor([[129627.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(529472.2500, grad_fn=<MseLossBackward>)
output :  tensor([[154229.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(52770.7031, grad_fn=<MseLossBackward>)
output :  tensor([[126418.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(337660.8750, grad_fn=<MseLossBackward>)
output :  tensor([[76890.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(152532.9688, grad_fn=<MseLossBackward>)
output :  tensor([[83124.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(1263780., grad_fn=<MseLossBackward>)
output :  tensor([[243056.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2225e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139162.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1091e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134851.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(18939088., grad_fn=<MseLossBackward>)
output :  tensor([[168620.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2626526.7500, grad_fn=<MseLossBackward>)
output :  tensor([[233412.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2519461.7500, grad_fn=<MseLossBackward>)
output :  tensor([[189923.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4914257.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154763.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1529975.7500, grad_fn=<MseLossBackward>)
output :  tensor([[199276.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1894623.2500, grad_fn=<MseLossBackward>)
output :  tensor([[203816.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1011e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139447.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5991786., grad_fn=<MseLossBackward>)
output :  tensor([[154757.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(58685.0625, grad_fn=<MseLossBackward>)
output :  tensor([[135512.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(237641.0156, grad_fn=<MseLossBackward>)
output :  tensor([[198434.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9637e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148605.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(29102822., grad_fn=<MseLossBackward>)
output :  tensor([[137549.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9404e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147093.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4809523., grad_fn=<MseLossBackward>)
output :  tensor([[207361.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(21514088., grad_fn=<MseLossBackward>)
output :  tensor([[105747.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6396e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164590.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8466918., grad_fn=<MseLossBackward>)
output :  tensor([[128132.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(17434.3145, grad_fn=<MseLossBackward>)
output :  tensor([[146265.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(539513.1875, grad_fn=<MseLossBackward>)
output :  tensor([[106693.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9634e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139549.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4201667., grad_fn=<MseLossBackward>)
output :  tensor([[236358.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(128611.8906, grad_fn=<MseLossBackward>)
output :  tensor([[146512.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2289074.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137729.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(52483.9453, grad_fn=<MseLossBackward>)
output :  tensor([[164035.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2986e+09, grad_fn=<MseLossBackward>)
output :  tensor([[270501.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(56230784., grad_fn=<MseLossBackward>)
output :  tensor([[171514.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(12148819., grad_fn=<MseLossBackward>)
output :  tensor([[105275.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(6245977., grad_fn=<MseLossBackward>)
output :  tensor([[200094.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9916e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162985.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(15882716., grad_fn=<MseLossBackward>)
output :  tensor([[161943.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6433e+10, grad_fn=<MseLossBackward>)
output :  tensor([[98431.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(17189.6680, grad_fn=<MseLossBackward>)
output :  tensor([[127102.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(12265044., grad_fn=<MseLossBackward>)
output :  tensor([[155080.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(845566.4375, grad_fn=<MseLossBackward>)
output :  tensor([[141768.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3127758., grad_fn=<MseLossBackward>)
output :  tensor([[200221.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(49138.4219, grad_fn=<MseLossBackward>)
output :  tensor([[144249.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5061375., grad_fn=<MseLossBackward>)
output :  tensor([[267860.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(31145468., grad_fn=<MseLossBackward>)
output :  tensor([[128207.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2396e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164632.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(753098.5625, grad_fn=<MseLossBackward>)
output :  tensor([[187816.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(467193.6250, grad_fn=<MseLossBackward>)
output :  tensor([[123049.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7029e+08, grad_fn=<MseLossBackward>)
output :  tensor([[250493.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(243603.9375, grad_fn=<MseLossBackward>)
output :  tensor([[158390.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1851e+08, grad_fn=<MseLossBackward>)
output :  tensor([[245635.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(81724.5156, grad_fn=<MseLossBackward>)
output :  tensor([[141007.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(8956272., grad_fn=<MseLossBackward>)
output :  tensor([[208239.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3098315., grad_fn=<MseLossBackward>)
output :  tensor([[169705.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7258646.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154089.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7929.3457, grad_fn=<MseLossBackward>)
output :  tensor([[116722.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1632485.3750, grad_fn=<MseLossBackward>)
output :  tensor([[239656.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2500e+09, grad_fn=<MseLossBackward>)
output :  tensor([[235846.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(17253380., grad_fn=<MseLossBackward>)
output :  tensor([[153315.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(470.3477, grad_fn=<MseLossBackward>)
output :  tensor([[255127.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(51742.0312, grad_fn=<MseLossBackward>)
output :  tensor([[122322.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(61136516., grad_fn=<MseLossBackward>)
output :  tensor([[175850.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(22219.6289, grad_fn=<MseLossBackward>)
output :  tensor([[161792.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3211320., grad_fn=<MseLossBackward>)
output :  tensor([[133949.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(8701025., grad_fn=<MseLossBackward>)
output :  tensor([[191848.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8873e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164668.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(447310.1562, grad_fn=<MseLossBackward>)
output :  tensor([[166107.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(9657527., grad_fn=<MseLossBackward>)
output :  tensor([[155802.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4829487., grad_fn=<MseLossBackward>)
output :  tensor([[152519.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6861043.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172644.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9872e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160940.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(883952.5625, grad_fn=<MseLossBackward>)
output :  tensor([[377634.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(40134204., grad_fn=<MseLossBackward>)
output :  tensor([[120987.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(36144612., grad_fn=<MseLossBackward>)
output :  tensor([[130951.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0658e+09, grad_fn=<MseLossBackward>)
output :  tensor([[280982.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(53159.0664, grad_fn=<MseLossBackward>)
output :  tensor([[161626.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(139198.9531, grad_fn=<MseLossBackward>)
output :  tensor([[131642.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2416e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237314.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(28243246., grad_fn=<MseLossBackward>)
output :  tensor([[181268.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(590208.0625, grad_fn=<MseLossBackward>)
output :  tensor([[155798.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(14429433., grad_fn=<MseLossBackward>)
output :  tensor([[145388.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(150944.3906, grad_fn=<MseLossBackward>)
output :  tensor([[153640.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8025e+08, grad_fn=<MseLossBackward>)
output :  tensor([[103848.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(14811433., grad_fn=<MseLossBackward>)
output :  tensor([[76640.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7691e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164311.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(473709.5625, grad_fn=<MseLossBackward>)
output :  tensor([[184783.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8677e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158724.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(524741.7500, grad_fn=<MseLossBackward>)
output :  tensor([[159303.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3254077.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138569.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1252265.8750, grad_fn=<MseLossBackward>)
output :  tensor([[204626.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1751693.6250, grad_fn=<MseLossBackward>)
output :  tensor([[140840.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8066310., grad_fn=<MseLossBackward>)
output :  tensor([[182681.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6210e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146876.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(767512.8750, grad_fn=<MseLossBackward>)
output :  tensor([[113083.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0501e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94287.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(82908., grad_fn=<MseLossBackward>)
output :  tensor([[175152.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(23332.5625, grad_fn=<MseLossBackward>)
output :  tensor([[256191.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(17707528., grad_fn=<MseLossBackward>)
output :  tensor([[142129.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(396348.9375, grad_fn=<MseLossBackward>)
output :  tensor([[160969.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1153912.3750, grad_fn=<MseLossBackward>)
output :  tensor([[130850.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2720489.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147461.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4155800.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169279.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1901856.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128029.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1059066.1250, grad_fn=<MseLossBackward>)
output :  tensor([[170019.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2599e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157747.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(558592.7500, grad_fn=<MseLossBackward>)
output :  tensor([[120063.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(12698421., grad_fn=<MseLossBackward>)
output :  tensor([[163574.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8199e+09, grad_fn=<MseLossBackward>)
output :  tensor([[51029.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(941748.9375, grad_fn=<MseLossBackward>)
output :  tensor([[230248.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7654e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201419.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(175993.3594, grad_fn=<MseLossBackward>)
output :  tensor([[185666.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(444472.2188, grad_fn=<MseLossBackward>)
output :  tensor([[105648.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(123623.6562, grad_fn=<MseLossBackward>)
output :  tensor([[92131.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(26334698., grad_fn=<MseLossBackward>)
output :  tensor([[137059.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8648378., grad_fn=<MseLossBackward>)
output :  tensor([[220083.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4637e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201275.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(38739536., grad_fn=<MseLossBackward>)
output :  tensor([[164695.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(92691.7031, grad_fn=<MseLossBackward>)
output :  tensor([[172835.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4944e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189566.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(188057.7500, grad_fn=<MseLossBackward>)
output :  tensor([[86810.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(36040.6484, grad_fn=<MseLossBackward>)
output :  tensor([[138454.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2387459.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109905.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(353105.2188, grad_fn=<MseLossBackward>)
output :  tensor([[147550.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3435e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172812.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7483e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194001.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2096e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177359.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6973065.5000, grad_fn=<MseLossBackward>)
output :  tensor([[98455.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3825630.5000, grad_fn=<MseLossBackward>)
output :  tensor([[115909.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2528249., grad_fn=<MseLossBackward>)
output :  tensor([[160149.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6883e+08, grad_fn=<MseLossBackward>)
output :  tensor([[200984.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(969055.6875, grad_fn=<MseLossBackward>)
output :  tensor([[147146.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(9902232., grad_fn=<MseLossBackward>)
train_loss: [2.597601e+09]
epoch_result tensor([0.])
output :  tensor([[159750.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1562851.6250, grad_fn=<MseLossBackward>)
output :  tensor([[120409.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(2528373.2500, grad_fn=<MseLossBackward>)
output :  tensor([[195928.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2983284.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175778.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1492749.3750, grad_fn=<MseLossBackward>)
output :  tensor([[151012.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2834e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131577.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(12799960., grad_fn=<MseLossBackward>)
output :  tensor([[139920.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1164881.7500, grad_fn=<MseLossBackward>)
output :  tensor([[118105.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(799752.9375, grad_fn=<MseLossBackward>)
output :  tensor([[66959.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(71558776., grad_fn=<MseLossBackward>)
output :  tensor([[165676.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(104399.6719, grad_fn=<MseLossBackward>)
output :  tensor([[144701.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(22105130., grad_fn=<MseLossBackward>)
output :  tensor([[221245.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(14096036., grad_fn=<MseLossBackward>)
output :  tensor([[169390.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(152795.4844, grad_fn=<MseLossBackward>)
output :  tensor([[249260.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(193064.1250, grad_fn=<MseLossBackward>)
output :  tensor([[54059.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(884026., grad_fn=<MseLossBackward>)
output :  tensor([[160754.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6419e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174404.]], grad_fn=<AddmmBackward>)
loss:  tensor(355216., grad_fn=<MseLossBackward>)
output :  tensor([[158632.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4546690., grad_fn=<MseLossBackward>)
output :  tensor([[275256.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(65840.3516, grad_fn=<MseLossBackward>)
output :  tensor([[196209.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(625186.7500, grad_fn=<MseLossBackward>)
output :  tensor([[136398.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6232e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195241.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1856789.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176841.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3096e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153663.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(7094315.5000, grad_fn=<MseLossBackward>)
output :  tensor([[173249.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(10557524., grad_fn=<MseLossBackward>)
output :  tensor([[84524.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(767334.9375, grad_fn=<MseLossBackward>)
output :  tensor([[170519.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3084e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184764.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(55416.1016, grad_fn=<MseLossBackward>)
output :  tensor([[205923.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4579e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108583.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2007224.8750, grad_fn=<MseLossBackward>)
output :  tensor([[173158.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4660066.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135237.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1593985.1250, grad_fn=<MseLossBackward>)
output :  tensor([[130340.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(1795914.1250, grad_fn=<MseLossBackward>)
output :  tensor([[122755.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(10599196., grad_fn=<MseLossBackward>)
output :  tensor([[146327.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6010e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169930.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1045e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150628.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(862489.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180682.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(465230.5625, grad_fn=<MseLossBackward>)
output :  tensor([[146183.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(26871102., grad_fn=<MseLossBackward>)
output :  tensor([[108361.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3714e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135723.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2848e+09, grad_fn=<MseLossBackward>)
output :  tensor([[132507.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6213335., grad_fn=<MseLossBackward>)
output :  tensor([[137240.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0487e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224596.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(162774.4219, grad_fn=<MseLossBackward>)
output :  tensor([[132717.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(218570.8594, grad_fn=<MseLossBackward>)
output :  tensor([[150498.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2245502.2500, grad_fn=<MseLossBackward>)
output :  tensor([[115881.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(15063192., grad_fn=<MseLossBackward>)
output :  tensor([[158152.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3412621.2500, grad_fn=<MseLossBackward>)
output :  tensor([[147094.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2949e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195912.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(15307412., grad_fn=<MseLossBackward>)
output :  tensor([[134637.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(35050.8594, grad_fn=<MseLossBackward>)
output :  tensor([[101805.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(67142024., grad_fn=<MseLossBackward>)
output :  tensor([[233161.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(703265.6875, grad_fn=<MseLossBackward>)
output :  tensor([[167085.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1534e+09, grad_fn=<MseLossBackward>)
output :  tensor([[168438.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(89077024., grad_fn=<MseLossBackward>)
output :  tensor([[202159.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9016e+10, grad_fn=<MseLossBackward>)
output :  tensor([[250161.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0782e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142769.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(532922.8125, grad_fn=<MseLossBackward>)
output :  tensor([[135144.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1310703., grad_fn=<MseLossBackward>)
output :  tensor([[152965.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4139826., grad_fn=<MseLossBackward>)
output :  tensor([[133980.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(15844753., grad_fn=<MseLossBackward>)
output :  tensor([[178648.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6180e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181773.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5412384., grad_fn=<MseLossBackward>)
output :  tensor([[167783.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(39482568., grad_fn=<MseLossBackward>)
output :  tensor([[149866.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(47146892., grad_fn=<MseLossBackward>)
output :  tensor([[145214.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(7368256., grad_fn=<MseLossBackward>)
output :  tensor([[143860.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1299315., grad_fn=<MseLossBackward>)
output :  tensor([[173169.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4244e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192947.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7854e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136083.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(173875.9688, grad_fn=<MseLossBackward>)
output :  tensor([[172756.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(734181.1875, grad_fn=<MseLossBackward>)
output :  tensor([[178908.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4374764.5000, grad_fn=<MseLossBackward>)
output :  tensor([[116890.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3573340.5000, grad_fn=<MseLossBackward>)
output :  tensor([[218732.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5139926.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182982.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(267951.8125, grad_fn=<MseLossBackward>)
output :  tensor([[124721.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(605806.8125, grad_fn=<MseLossBackward>)
output :  tensor([[196517.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(316.7288, grad_fn=<MseLossBackward>)
output :  tensor([[173710.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1414910.2500, grad_fn=<MseLossBackward>)
output :  tensor([[208324.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1658e+10, grad_fn=<MseLossBackward>)
output :  tensor([[210423.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(332118.0938, grad_fn=<MseLossBackward>)
output :  tensor([[164671.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1338e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193231.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1608933.7500, grad_fn=<MseLossBackward>)
output :  tensor([[113408.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(166770.1406, grad_fn=<MseLossBackward>)
output :  tensor([[115448.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(8696417., grad_fn=<MseLossBackward>)
output :  tensor([[110792.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(1457018.7500, grad_fn=<MseLossBackward>)
output :  tensor([[148967.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4699953., grad_fn=<MseLossBackward>)
output :  tensor([[158579.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3879e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179724.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(75745.3594, grad_fn=<MseLossBackward>)
output :  tensor([[128311.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(659102.9375, grad_fn=<MseLossBackward>)
output :  tensor([[147393.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5729066.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180242.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0560e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117773.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(763384.4375, grad_fn=<MseLossBackward>)
output :  tensor([[202263.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(27701966., grad_fn=<MseLossBackward>)
output :  tensor([[148816.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(14565434., grad_fn=<MseLossBackward>)
output :  tensor([[214877.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3911124.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128043.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(4175541., grad_fn=<MseLossBackward>)
output :  tensor([[246455.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3507953.5000, grad_fn=<MseLossBackward>)
output :  tensor([[237793.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2285e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148126.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7979e+08, grad_fn=<MseLossBackward>)
output :  tensor([[84357.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4555e+08, grad_fn=<MseLossBackward>)
output :  tensor([[193466.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6315e+09, grad_fn=<MseLossBackward>)
output :  tensor([[79431.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2461712., grad_fn=<MseLossBackward>)
output :  tensor([[138920.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(335693.5000, grad_fn=<MseLossBackward>)
output :  tensor([[78204.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(7312841.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143476.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(274019.5312, grad_fn=<MseLossBackward>)
output :  tensor([[177307.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1710291.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153502.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9065, grad_fn=<MseLossBackward>)
output :  tensor([[110020.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6865874., grad_fn=<MseLossBackward>)
output :  tensor([[206607.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1912e+10, grad_fn=<MseLossBackward>)
output :  tensor([[128637.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(19031.0645, grad_fn=<MseLossBackward>)
output :  tensor([[267520.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5574e+08, grad_fn=<MseLossBackward>)
output :  tensor([[299292.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1466e+08, grad_fn=<MseLossBackward>)
output :  tensor([[108080.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(336844.2188, grad_fn=<MseLossBackward>)
output :  tensor([[169666.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8029696.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131834.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6806e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135905.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(9574286., grad_fn=<MseLossBackward>)
output :  tensor([[133110.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8182907., grad_fn=<MseLossBackward>)
output :  tensor([[123055.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(3782569.2500, grad_fn=<MseLossBackward>)
output :  tensor([[133304.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6664e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225520.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8998e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189398.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2983e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145271.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1880798., grad_fn=<MseLossBackward>)
output :  tensor([[136149.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(74806280., grad_fn=<MseLossBackward>)
output :  tensor([[111655.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(164772.5625, grad_fn=<MseLossBackward>)
output :  tensor([[254064.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0956e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133442.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2427120.5000, grad_fn=<MseLossBackward>)
output :  tensor([[201125.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3514570.5000, grad_fn=<MseLossBackward>)
output :  tensor([[104478.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(177945.5625, grad_fn=<MseLossBackward>)
output :  tensor([[140632.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(465763.5938, grad_fn=<MseLossBackward>)
output :  tensor([[205823.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4881e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179594.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(93101.2656, grad_fn=<MseLossBackward>)
output :  tensor([[185057.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3295.4775, grad_fn=<MseLossBackward>)
output :  tensor([[162254.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1534e+10, grad_fn=<MseLossBackward>)
output :  tensor([[304163.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5092e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195956.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3775795.5000, grad_fn=<MseLossBackward>)
output :  tensor([[257704.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1070e+10, grad_fn=<MseLossBackward>)
output :  tensor([[223067.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8432e+09, grad_fn=<MseLossBackward>)
output :  tensor([[286623.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2274e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220665.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(11121391., grad_fn=<MseLossBackward>)
output :  tensor([[222218.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8826e+10, grad_fn=<MseLossBackward>)
output :  tensor([[203392.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(40867052., grad_fn=<MseLossBackward>)
output :  tensor([[158419.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6550e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131162.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1789700.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134858.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(411883.1875, grad_fn=<MseLossBackward>)
output :  tensor([[90600.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(159637.7031, grad_fn=<MseLossBackward>)
output :  tensor([[105266.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(7471509.5000, grad_fn=<MseLossBackward>)
output :  tensor([[276572.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7381e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238598.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(12952464., grad_fn=<MseLossBackward>)
output :  tensor([[144197.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(644382.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138187.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(472398.4688, grad_fn=<MseLossBackward>)
output :  tensor([[174082.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(122073.8125, grad_fn=<MseLossBackward>)
output :  tensor([[151954.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(44954512., grad_fn=<MseLossBackward>)
output :  tensor([[162707.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0107e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166111.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1236196.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136149.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(723483.1250, grad_fn=<MseLossBackward>)
output :  tensor([[188071.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2996e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114477.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6136535.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170244.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3082383.7500, grad_fn=<MseLossBackward>)
output :  tensor([[124509.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(20337704., grad_fn=<MseLossBackward>)
output :  tensor([[89097.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4399244., grad_fn=<MseLossBackward>)
output :  tensor([[179110.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(791794.0625, grad_fn=<MseLossBackward>)
output :  tensor([[111161.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1591421.6250, grad_fn=<MseLossBackward>)
output :  tensor([[238749.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(62718.9414, grad_fn=<MseLossBackward>)
output :  tensor([[245812.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(660638.7500, grad_fn=<MseLossBackward>)
output :  tensor([[126732.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(7661694.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110495.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(2360376., grad_fn=<MseLossBackward>)
output :  tensor([[288695.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2040e+10, grad_fn=<MseLossBackward>)
output :  tensor([[173017.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2303375.2500, grad_fn=<MseLossBackward>)
output :  tensor([[125516.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(266352.7500, grad_fn=<MseLossBackward>)
output :  tensor([[143074.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2872e+08, grad_fn=<MseLossBackward>)
output :  tensor([[201313.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6095e+08, grad_fn=<MseLossBackward>)
output :  tensor([[142082.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1172009.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156643.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5217e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152021.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3527999.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132695.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(10209423., grad_fn=<MseLossBackward>)
output :  tensor([[244473.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7963e+10, grad_fn=<MseLossBackward>)
output :  tensor([[402199.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(39688.1094, grad_fn=<MseLossBackward>)
output :  tensor([[112820.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(14593653., grad_fn=<MseLossBackward>)
output :  tensor([[113539.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(24607722., grad_fn=<MseLossBackward>)
output :  tensor([[157784.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2942243.2500, grad_fn=<MseLossBackward>)
output :  tensor([[131439.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0897e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163500.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4221e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171409.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7711e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107110.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(12324488., grad_fn=<MseLossBackward>)
output :  tensor([[141803.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(645260.7500, grad_fn=<MseLossBackward>)
output :  tensor([[360147.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(51072016., grad_fn=<MseLossBackward>)
output :  tensor([[202015.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7024e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176537.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1076600.7500, grad_fn=<MseLossBackward>)
output :  tensor([[205652.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(7576514.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140719.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2956734., grad_fn=<MseLossBackward>)
output :  tensor([[193051.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2098242.7500, grad_fn=<MseLossBackward>)
output :  tensor([[136094.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1766e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179922.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1160433.8750, grad_fn=<MseLossBackward>)
output :  tensor([[236054.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(35347668., grad_fn=<MseLossBackward>)
output :  tensor([[173060.]], grad_fn=<AddmmBackward>)
loss:  tensor(883600., grad_fn=<MseLossBackward>)
output :  tensor([[110180.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4754853., grad_fn=<MseLossBackward>)
output :  tensor([[266024.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2141649.2500, grad_fn=<MseLossBackward>)
output :  tensor([[256107.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(37300984., grad_fn=<MseLossBackward>)
output :  tensor([[124356.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1839541.2500, grad_fn=<MseLossBackward>)
output :  tensor([[217533.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3024e+09, grad_fn=<MseLossBackward>)
output :  tensor([[302972.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9854e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206930.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4878.1494, grad_fn=<MseLossBackward>)
output :  tensor([[212948.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6142e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159294.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1943758.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169098.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(795023., grad_fn=<MseLossBackward>)
output :  tensor([[164321.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(54610484., grad_fn=<MseLossBackward>)
output :  tensor([[172778.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7717891.5000, grad_fn=<MseLossBackward>)
output :  tensor([[234769.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1043e+09, grad_fn=<MseLossBackward>)
output :  tensor([[216993.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5531e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160005.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6913e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122528.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(222481.7344, grad_fn=<MseLossBackward>)
output :  tensor([[175271.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2989170.7500, grad_fn=<MseLossBackward>)
output :  tensor([[180462.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3263e+09, grad_fn=<MseLossBackward>)
output :  tensor([[207273.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5098e+10, grad_fn=<MseLossBackward>)
output :  tensor([[137827.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(11527723., grad_fn=<MseLossBackward>)
output :  tensor([[148069.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0062e+08, grad_fn=<MseLossBackward>)
output :  tensor([[277196.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(38538.5977, grad_fn=<MseLossBackward>)
output :  tensor([[84032.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(935209.8750, grad_fn=<MseLossBackward>)
output :  tensor([[235642.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(735520.6250, grad_fn=<MseLossBackward>)
output :  tensor([[256643.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0646e+11, grad_fn=<MseLossBackward>)
output :  tensor([[170288.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(83439.7422, grad_fn=<MseLossBackward>)
output :  tensor([[193273.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7411e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152359.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6972818., grad_fn=<MseLossBackward>)
output :  tensor([[206888.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9831e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128662.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(114191.1953, grad_fn=<MseLossBackward>)
output :  tensor([[142856.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4593721.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169546.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3151e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183276.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6623706.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125353.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(418053.1562, grad_fn=<MseLossBackward>)
output :  tensor([[138326.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3335303.2500, grad_fn=<MseLossBackward>)
output :  tensor([[172689.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(96701.5625, grad_fn=<MseLossBackward>)
output :  tensor([[198720.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6296e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238975.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(16193079., grad_fn=<MseLossBackward>)
output :  tensor([[153169.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3349014.5000, grad_fn=<MseLossBackward>)
output :  tensor([[193205.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7806698., grad_fn=<MseLossBackward>)
output :  tensor([[162889.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5681e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183999.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(20245922., grad_fn=<MseLossBackward>)
output :  tensor([[179138.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(579549.1250, grad_fn=<MseLossBackward>)
output :  tensor([[96825.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(30482.9766, grad_fn=<MseLossBackward>)
output :  tensor([[172332.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1592e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132993.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4025352.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120877.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(34541332., grad_fn=<MseLossBackward>)
output :  tensor([[174866.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(750876.4375, grad_fn=<MseLossBackward>)
output :  tensor([[85482.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(233236.1719, grad_fn=<MseLossBackward>)
output :  tensor([[287710.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5240951.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166730.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2993332.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191227.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0147e+10, grad_fn=<MseLossBackward>)
output :  tensor([[245669.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4164e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152743.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3038103.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124229.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(52451.7344, grad_fn=<MseLossBackward>)
output :  tensor([[119618.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(79193.8750, grad_fn=<MseLossBackward>)
output :  tensor([[144127.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4843e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172135.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3477292.5000, grad_fn=<MseLossBackward>)
output :  tensor([[112498.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9989e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207349.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2243e+10, grad_fn=<MseLossBackward>)
output :  tensor([[235650.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(34211348., grad_fn=<MseLossBackward>)
output :  tensor([[252969.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0227e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222577.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6971e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196849.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4078e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189640.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4581138.5000, grad_fn=<MseLossBackward>)
output :  tensor([[204912.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8381e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188910.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1635e+10, grad_fn=<MseLossBackward>)
output :  tensor([[175716.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(9142781., grad_fn=<MseLossBackward>)
output :  tensor([[153674.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2802485.2500, grad_fn=<MseLossBackward>)
output :  tensor([[331657.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(28540970., grad_fn=<MseLossBackward>)
output :  tensor([[210845.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1332545.6250, grad_fn=<MseLossBackward>)
output :  tensor([[159015.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(969394.0625, grad_fn=<MseLossBackward>)
output :  tensor([[187854.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8778e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107478.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(6142381.5000, grad_fn=<MseLossBackward>)
output :  tensor([[274399.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8737e+10, grad_fn=<MseLossBackward>)
output :  tensor([[172292.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2583905.5000, grad_fn=<MseLossBackward>)
output :  tensor([[210082.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(11680374., grad_fn=<MseLossBackward>)
output :  tensor([[212647.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(69765824., grad_fn=<MseLossBackward>)
output :  tensor([[178434.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(585846.7500, grad_fn=<MseLossBackward>)
output :  tensor([[199519.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5202747., grad_fn=<MseLossBackward>)
output :  tensor([[155302.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(91761.6641, grad_fn=<MseLossBackward>)
output :  tensor([[148835.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3849e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118879.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(144032.1094, grad_fn=<MseLossBackward>)
output :  tensor([[139945.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2956.6406, grad_fn=<MseLossBackward>)
output :  tensor([[149788.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(622225.1875, grad_fn=<MseLossBackward>)
output :  tensor([[202384.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5779e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160913.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1998247.2500, grad_fn=<MseLossBackward>)
output :  tensor([[100045.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(297698.1250, grad_fn=<MseLossBackward>)
output :  tensor([[224463.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4137e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184487.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6054e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174833.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2727091., grad_fn=<MseLossBackward>)
output :  tensor([[85218.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(10358290., grad_fn=<MseLossBackward>)
output :  tensor([[132511.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(16093010., grad_fn=<MseLossBackward>)
output :  tensor([[214733.]], grad_fn=<AddmmBackward>)
loss:  tensor(537289., grad_fn=<MseLossBackward>)
output :  tensor([[143357.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(412725.9375, grad_fn=<MseLossBackward>)
output :  tensor([[134880.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(23814858., grad_fn=<MseLossBackward>)
output :  tensor([[142336.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(69210.1016, grad_fn=<MseLossBackward>)
output :  tensor([[178115.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6496e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146761.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7624674., grad_fn=<MseLossBackward>)
output :  tensor([[160564.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(319030.8125, grad_fn=<MseLossBackward>)
output :  tensor([[216797.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3231568., grad_fn=<MseLossBackward>)
output :  tensor([[137401.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0498e+09, grad_fn=<MseLossBackward>)
output :  tensor([[256901.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3614216.7500, grad_fn=<MseLossBackward>)
output :  tensor([[157847.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2730911.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128866.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(134247.8125, grad_fn=<MseLossBackward>)
output :  tensor([[93577.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2022217.3750, grad_fn=<MseLossBackward>)
output :  tensor([[156305.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1561e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180535.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(404396.6250, grad_fn=<MseLossBackward>)
output :  tensor([[123788.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(10816390., grad_fn=<MseLossBackward>)
output :  tensor([[189588.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5493e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145636.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3741e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151474.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2479345.5000, grad_fn=<MseLossBackward>)
output :  tensor([[188141.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(153284.4844, grad_fn=<MseLossBackward>)
output :  tensor([[251937.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6924e+09, grad_fn=<MseLossBackward>)
output :  tensor([[90218.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(1642943.1250, grad_fn=<MseLossBackward>)
output :  tensor([[239682.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(100657.4766, grad_fn=<MseLossBackward>)
output :  tensor([[126193.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(5320266.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166059.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9681e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113441.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8067e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176910.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(829181., grad_fn=<MseLossBackward>)
output :  tensor([[163365.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7437e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154072.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5567e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239104.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(11018.4385, grad_fn=<MseLossBackward>)
output :  tensor([[226386.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9940e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128000.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(1000734.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125361.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(407512.6562, grad_fn=<MseLossBackward>)
output :  tensor([[226531.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(219536.1719, grad_fn=<MseLossBackward>)
output :  tensor([[232374.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2642859.7500, grad_fn=<MseLossBackward>)
output :  tensor([[228339.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2689292.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146978.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1043175., grad_fn=<MseLossBackward>)
output :  tensor([[215792.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(33548712., grad_fn=<MseLossBackward>)
output :  tensor([[130552.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1136e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132487.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(167.3789, grad_fn=<MseLossBackward>)
output :  tensor([[308794.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(38502412., grad_fn=<MseLossBackward>)
output :  tensor([[144223.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(10389240., grad_fn=<MseLossBackward>)
output :  tensor([[119850.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7931e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109764.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(70113.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156220.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6503e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179237.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1179e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173037.]], grad_fn=<AddmmBackward>)
loss:  tensor(1369., grad_fn=<MseLossBackward>)
output :  tensor([[192475.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(72661240., grad_fn=<MseLossBackward>)
output :  tensor([[94748.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(27580960., grad_fn=<MseLossBackward>)
output :  tensor([[177628.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1882255.3750, grad_fn=<MseLossBackward>)
output :  tensor([[168214.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(98674.5156, grad_fn=<MseLossBackward>)
output :  tensor([[140410.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1988584.7500, grad_fn=<MseLossBackward>)
output :  tensor([[259347.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9506e+09, grad_fn=<MseLossBackward>)
output :  tensor([[140843.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1185e+09, grad_fn=<MseLossBackward>)
output :  tensor([[169675.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(11049080., grad_fn=<MseLossBackward>)
output :  tensor([[141370.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1878998.3750, grad_fn=<MseLossBackward>)
output :  tensor([[202153.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2734424., grad_fn=<MseLossBackward>)
output :  tensor([[168628.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1880669.3750, grad_fn=<MseLossBackward>)
output :  tensor([[243729.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(73161.7969, grad_fn=<MseLossBackward>)
output :  tensor([[136759.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5104422.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150352.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1004035.3125, grad_fn=<MseLossBackward>)
output :  tensor([[213400.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2558100.2500, grad_fn=<MseLossBackward>)
output :  tensor([[166071.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1148313.1250, grad_fn=<MseLossBackward>)
output :  tensor([[188753.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(60569.8242, grad_fn=<MseLossBackward>)
output :  tensor([[133259.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6257e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128051.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(900334.1250, grad_fn=<MseLossBackward>)
output :  tensor([[146155.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(37891144., grad_fn=<MseLossBackward>)
output :  tensor([[198388.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0568e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166368.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6388e+09, grad_fn=<MseLossBackward>)
output :  tensor([[75728.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4740e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93090.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(73795344., grad_fn=<MseLossBackward>)
output :  tensor([[255340.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4191744.5000, grad_fn=<MseLossBackward>)
output :  tensor([[201907.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9573e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113671.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(1764434.8750, grad_fn=<MseLossBackward>)
output :  tensor([[157003.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3001e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209105.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1869e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177929.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4770e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156535.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2358288., grad_fn=<MseLossBackward>)
output :  tensor([[167639.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5569821.5000, grad_fn=<MseLossBackward>)
output :  tensor([[115693.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(481267.3750, grad_fn=<MseLossBackward>)
output :  tensor([[161195.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(38382864., grad_fn=<MseLossBackward>)
output :  tensor([[193010.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9293e+08, grad_fn=<MseLossBackward>)
output :  tensor([[217571.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3720739.5000, grad_fn=<MseLossBackward>)
output :  tensor([[247953.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4706e+11, grad_fn=<MseLossBackward>)
output :  tensor([[146409.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(348524.1875, grad_fn=<MseLossBackward>)
output :  tensor([[108835.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(126552.5078, grad_fn=<MseLossBackward>)
output :  tensor([[168215.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8726e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152792.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5256631., grad_fn=<MseLossBackward>)
output :  tensor([[232863.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(17109856., grad_fn=<MseLossBackward>)
output :  tensor([[114087.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(832513.6875, grad_fn=<MseLossBackward>)
output :  tensor([[179627.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(10709256., grad_fn=<MseLossBackward>)
output :  tensor([[183376.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(11045237., grad_fn=<MseLossBackward>)
output :  tensor([[165193.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3965e+10, grad_fn=<MseLossBackward>)
output :  tensor([[95469.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0937e+08, grad_fn=<MseLossBackward>)
output :  tensor([[234688.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(18589166., grad_fn=<MseLossBackward>)
output :  tensor([[175763.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(56028.3711, grad_fn=<MseLossBackward>)
output :  tensor([[139881.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(14042.2500, grad_fn=<MseLossBackward>)
output :  tensor([[236130.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1277994.8750, grad_fn=<MseLossBackward>)
output :  tensor([[161820.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1392141.8750, grad_fn=<MseLossBackward>)
output :  tensor([[202056.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5115e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136130.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1278136.2500, grad_fn=<MseLossBackward>)
output :  tensor([[187094.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2972e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137043.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1088761.8750, grad_fn=<MseLossBackward>)
output :  tensor([[227518.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(71931072., grad_fn=<MseLossBackward>)
output :  tensor([[226574.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4877e+08, grad_fn=<MseLossBackward>)
output :  tensor([[89962.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(1413.8774, grad_fn=<MseLossBackward>)
output :  tensor([[157680.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3075693.7500, grad_fn=<MseLossBackward>)
output :  tensor([[245673.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5676e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145795.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(633193.1875, grad_fn=<MseLossBackward>)
output :  tensor([[111452.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9760e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164515.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(237.8342, grad_fn=<MseLossBackward>)
output :  tensor([[143772.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(51976.8750, grad_fn=<MseLossBackward>)
output :  tensor([[129232.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1065765.8750, grad_fn=<MseLossBackward>)
output :  tensor([[189661.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8079e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124393.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(3585904.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150469.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2343865.2500, grad_fn=<MseLossBackward>)
output :  tensor([[169576.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4724306., grad_fn=<MseLossBackward>)
output :  tensor([[153560.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6558641., grad_fn=<MseLossBackward>)
output :  tensor([[159151.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(14051838., grad_fn=<MseLossBackward>)
output :  tensor([[136012.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2969e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133629.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2656136., grad_fn=<MseLossBackward>)
output :  tensor([[153307.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0472e+08, grad_fn=<MseLossBackward>)
output :  tensor([[142685.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2150439., grad_fn=<MseLossBackward>)
output :  tensor([[166698.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(24491674., grad_fn=<MseLossBackward>)
output :  tensor([[137469.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6008e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151086.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5228725.5000, grad_fn=<MseLossBackward>)
output :  tensor([[187013.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(973089.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169162.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(26421.4863, grad_fn=<MseLossBackward>)
output :  tensor([[179915.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7061.2510, grad_fn=<MseLossBackward>)
output :  tensor([[220222.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(49492.3438, grad_fn=<MseLossBackward>)
output :  tensor([[110369.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(6100630., grad_fn=<MseLossBackward>)
output :  tensor([[136922.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4454e+08, grad_fn=<MseLossBackward>)
output :  tensor([[285391.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(370462.4375, grad_fn=<MseLossBackward>)
output :  tensor([[116601.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(362225.3125, grad_fn=<MseLossBackward>)
output :  tensor([[175446.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9850e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179158.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(34124036., grad_fn=<MseLossBackward>)
output :  tensor([[178474.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(49351284., grad_fn=<MseLossBackward>)
output :  tensor([[249622.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4400e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221513.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(236408.6719, grad_fn=<MseLossBackward>)
output :  tensor([[126231.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1338e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174153.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4745e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124160.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(25883.2793, grad_fn=<MseLossBackward>)
output :  tensor([[185882.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3957e+10, grad_fn=<MseLossBackward>)
output :  tensor([[156720.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(13838633., grad_fn=<MseLossBackward>)
output :  tensor([[154609.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(65766016., grad_fn=<MseLossBackward>)
output :  tensor([[205523.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(603146.3750, grad_fn=<MseLossBackward>)
output :  tensor([[144958.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5520e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176206.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(42648.7031, grad_fn=<MseLossBackward>)
output :  tensor([[248628.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5305e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148545.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(297467.9688, grad_fn=<MseLossBackward>)
output :  tensor([[202195.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(220709.1094, grad_fn=<MseLossBackward>)
output :  tensor([[163593.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(13274068., grad_fn=<MseLossBackward>)
output :  tensor([[120521.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0577e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136331.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(338487.5938, grad_fn=<MseLossBackward>)
output :  tensor([[177461.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(42746464., grad_fn=<MseLossBackward>)
output :  tensor([[199070.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(82281056., grad_fn=<MseLossBackward>)
output :  tensor([[231681.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2854e+09, grad_fn=<MseLossBackward>)
output :  tensor([[259477.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6137774., grad_fn=<MseLossBackward>)
output :  tensor([[187257.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7356e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142704.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6219e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147448.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(8691533., grad_fn=<MseLossBackward>)
output :  tensor([[71476.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9079e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132014.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(8915916., grad_fn=<MseLossBackward>)
output :  tensor([[124717.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(17494810., grad_fn=<MseLossBackward>)
output :  tensor([[155571.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2470349., grad_fn=<MseLossBackward>)
output :  tensor([[133711.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(45050316., grad_fn=<MseLossBackward>)
output :  tensor([[77246.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(556574.3125, grad_fn=<MseLossBackward>)
output :  tensor([[80597.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(1967335., grad_fn=<MseLossBackward>)
output :  tensor([[231253.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(556725.8125, grad_fn=<MseLossBackward>)
output :  tensor([[140940.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0886e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129138.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(1855022.7500, grad_fn=<MseLossBackward>)
output :  tensor([[166577.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(178572.2656, grad_fn=<MseLossBackward>)
output :  tensor([[235878.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(771844.6250, grad_fn=<MseLossBackward>)
output :  tensor([[189700.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5952837.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154032.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3872839.5000, grad_fn=<MseLossBackward>)
output :  tensor([[199371.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2165818., grad_fn=<MseLossBackward>)
output :  tensor([[201076.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2905e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135900.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1208453.6250, grad_fn=<MseLossBackward>)
output :  tensor([[153716.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1648294.8750, grad_fn=<MseLossBackward>)
output :  tensor([[134798.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1442551.1250, grad_fn=<MseLossBackward>)
output :  tensor([[197173.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0776e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156035.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4144596.2500, grad_fn=<MseLossBackward>)
output :  tensor([[137552.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9406e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142839.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4247206., grad_fn=<MseLossBackward>)
output :  tensor([[206996.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(25035012., grad_fn=<MseLossBackward>)
output :  tensor([[102343.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1385e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168934.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2056893.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128933.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(871670.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145668.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1772143.3750, grad_fn=<MseLossBackward>)
output :  tensor([[107916.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0733e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135195.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5312449., grad_fn=<MseLossBackward>)
output :  tensor([[232700.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(10885463., grad_fn=<MseLossBackward>)
output :  tensor([[145408.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(166706.3438, grad_fn=<MseLossBackward>)
output :  tensor([[140820.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(11023334., grad_fn=<MseLossBackward>)
output :  tensor([[166000.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4440e+09, grad_fn=<MseLossBackward>)
output :  tensor([[269648.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(69752248., grad_fn=<MseLossBackward>)
output :  tensor([[180687.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(32352634., grad_fn=<MseLossBackward>)
output :  tensor([[104766.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3963770., grad_fn=<MseLossBackward>)
output :  tensor([[200460.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9351e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161335.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5452444., grad_fn=<MseLossBackward>)
output :  tensor([[164444.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5361e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97317.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(965582.6250, grad_fn=<MseLossBackward>)
output :  tensor([[122456.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(1306824.1250, grad_fn=<MseLossBackward>)
output :  tensor([[155972.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(742.5625, grad_fn=<MseLossBackward>)
output :  tensor([[144842.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(23446478., grad_fn=<MseLossBackward>)
output :  tensor([[198297.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2899517.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140461.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2365876.5000, grad_fn=<MseLossBackward>)
output :  tensor([[261734.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(298081.8750, grad_fn=<MseLossBackward>)
output :  tensor([[126261.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1063e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166153.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(426939.7188, grad_fn=<MseLossBackward>)
output :  tensor([[187614.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(783861.2500, grad_fn=<MseLossBackward>)
output :  tensor([[120630.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1302e+08, grad_fn=<MseLossBackward>)
output :  tensor([[252334.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5449015., grad_fn=<MseLossBackward>)
output :  tensor([[159795.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4008e+08, grad_fn=<MseLossBackward>)
output :  tensor([[242652.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7275073.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144712.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(507389.0938, grad_fn=<MseLossBackward>)
output :  tensor([[211801.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3246021.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176934.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(20560840., grad_fn=<MseLossBackward>)
output :  tensor([[153651.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(121299.8281, grad_fn=<MseLossBackward>)
output :  tensor([[123313.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(28232202., grad_fn=<MseLossBackward>)
output :  tensor([[238740.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3377e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238946.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1108841.8750, grad_fn=<MseLossBackward>)
output :  tensor([[151253.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4340256., grad_fn=<MseLossBackward>)
output :  tensor([[254877.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(523.2656, grad_fn=<MseLossBackward>)
output :  tensor([[121834.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(53733480., grad_fn=<MseLossBackward>)
output :  tensor([[176219.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(48386.2500, grad_fn=<MseLossBackward>)
output :  tensor([[162678.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(7174027.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133939.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(8642498., grad_fn=<MseLossBackward>)
output :  tensor([[194105.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1738e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165500.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2252907.2500, grad_fn=<MseLossBackward>)
output :  tensor([[161771.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1508751.6250, grad_fn=<MseLossBackward>)
output :  tensor([[158989.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(978244.6250, grad_fn=<MseLossBackward>)
output :  tensor([[146191.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(13754942., grad_fn=<MseLossBackward>)
output :  tensor([[170832.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7616e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160269.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(72849.3828, grad_fn=<MseLossBackward>)
output :  tensor([[380442.]], grad_fn=<AddmmBackward>)
loss:  tensor(12446784., grad_fn=<MseLossBackward>)
output :  tensor([[134124.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(50755828., grad_fn=<MseLossBackward>)
output :  tensor([[130619.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0358e+09, grad_fn=<MseLossBackward>)
output :  tensor([[284654.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(11840911., grad_fn=<MseLossBackward>)
output :  tensor([[164003.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4013949.7500, grad_fn=<MseLossBackward>)
output :  tensor([[133462.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6802e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226056.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(35323336., grad_fn=<MseLossBackward>)
output :  tensor([[184113.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(13058060., grad_fn=<MseLossBackward>)
output :  tensor([[154310.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5340432., grad_fn=<MseLossBackward>)
output :  tensor([[142930.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4284382.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152969.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5824e+08, grad_fn=<MseLossBackward>)
output :  tensor([[100100.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(10035.9697, grad_fn=<MseLossBackward>)
output :  tensor([[76662.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7763e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163709.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1664382.2500, grad_fn=<MseLossBackward>)
output :  tensor([[187947.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6042e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155955.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4181386., grad_fn=<MseLossBackward>)
output :  tensor([[153947.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(12618591., grad_fn=<MseLossBackward>)
output :  tensor([[136821.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(394501.7500, grad_fn=<MseLossBackward>)
output :  tensor([[206234.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(81162.6719, grad_fn=<MseLossBackward>)
output :  tensor([[139826.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3334675.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182321.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6302e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147977.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3908899.7500, grad_fn=<MseLossBackward>)
output :  tensor([[109715.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1369e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96065.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(4266710., grad_fn=<MseLossBackward>)
output :  tensor([[172784.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4906432.5000, grad_fn=<MseLossBackward>)
output :  tensor([[263095.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7267236.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140921.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(334517.6250, grad_fn=<MseLossBackward>)
output :  tensor([[160893.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(996097.5625, grad_fn=<MseLossBackward>)
output :  tensor([[133096.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(355830.9062, grad_fn=<MseLossBackward>)
output :  tensor([[154359.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(23614892., grad_fn=<MseLossBackward>)
output :  tensor([[168764.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(748143.9375, grad_fn=<MseLossBackward>)
output :  tensor([[128444.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2087754.1250, grad_fn=<MseLossBackward>)
output :  tensor([[171404.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9718e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155450.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2400030.2500, grad_fn=<MseLossBackward>)
output :  tensor([[118844.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(5496057.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160238.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2943e+09, grad_fn=<MseLossBackward>)
output :  tensor([[56441.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(19725256., grad_fn=<MseLossBackward>)
output :  tensor([[234198.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1311e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199438.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2439502.2500, grad_fn=<MseLossBackward>)
output :  tensor([[183770.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1512823.1250, grad_fn=<MseLossBackward>)
output :  tensor([[107100.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(1210395.3750, grad_fn=<MseLossBackward>)
output :  tensor([[88319.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(1742131.8750, grad_fn=<MseLossBackward>)
output :  tensor([[141414.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2000545., grad_fn=<MseLossBackward>)
output :  tensor([[220665.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3780e+09, grad_fn=<MseLossBackward>)
output :  tensor([[203769.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(13914648., grad_fn=<MseLossBackward>)
output :  tensor([[168945.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(15569436., grad_fn=<MseLossBackward>)
output :  tensor([[173666.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3418e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193427.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(11746899., grad_fn=<MseLossBackward>)
output :  tensor([[87821.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(675375.8125, grad_fn=<MseLossBackward>)
output :  tensor([[139931.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4730.8604, grad_fn=<MseLossBackward>)
output :  tensor([[112472.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3889153.7500, grad_fn=<MseLossBackward>)
output :  tensor([[148399.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5473e+08, grad_fn=<MseLossBackward>)
output :  tensor([[170477.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5585e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193438.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3366e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178855.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1310917.6250, grad_fn=<MseLossBackward>)
output :  tensor([[97394.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(800172.1875, grad_fn=<MseLossBackward>)
output :  tensor([[116263.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1529627.8750, grad_fn=<MseLossBackward>)
output :  tensor([[160437.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5521e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199171.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(686101.6250, grad_fn=<MseLossBackward>)
output :  tensor([[143246.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(567103.1250, grad_fn=<MseLossBackward>)
train_loss: [2.6016527e+09]
epoch_result tensor([0.])
output :  tensor([[158487.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(155.8596, grad_fn=<MseLossBackward>)
output :  tensor([[123165.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1358098.8750, grad_fn=<MseLossBackward>)
output :  tensor([[193072.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1272489.7500, grad_fn=<MseLossBackward>)
output :  tensor([[179223.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4945481., grad_fn=<MseLossBackward>)
output :  tensor([[154409.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5652e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123223.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(22818162., grad_fn=<MseLossBackward>)
output :  tensor([[141392.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(153823.2969, grad_fn=<MseLossBackward>)
output :  tensor([[119700.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(491138.1562, grad_fn=<MseLossBackward>)
output :  tensor([[69786.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2739e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165245.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(569576.8125, grad_fn=<MseLossBackward>)
output :  tensor([[139533.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(217680.5625, grad_fn=<MseLossBackward>)
output :  tensor([[225491.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(241879.5312, grad_fn=<MseLossBackward>)
output :  tensor([[166864.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4561027.5000, grad_fn=<MseLossBackward>)
output :  tensor([[254165.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(19939852., grad_fn=<MseLossBackward>)
output :  tensor([[58801.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(14451402., grad_fn=<MseLossBackward>)
output :  tensor([[160518.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5659e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185902.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1886e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153635.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(8204733.5000, grad_fn=<MseLossBackward>)
output :  tensor([[272543.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6034546., grad_fn=<MseLossBackward>)
output :  tensor([[196673.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(106898.3438, grad_fn=<MseLossBackward>)
output :  tensor([[138644.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4997e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194627.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(559878.0625, grad_fn=<MseLossBackward>)
output :  tensor([[179095.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0981e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151993.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(987073.3125, grad_fn=<MseLossBackward>)
output :  tensor([[171471.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2164484.5000, grad_fn=<MseLossBackward>)
output :  tensor([[89377.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(15819636., grad_fn=<MseLossBackward>)
output :  tensor([[170384.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2930e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185413.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(170801.3906, grad_fn=<MseLossBackward>)
output :  tensor([[206333.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4173e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113434.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(11793644., grad_fn=<MseLossBackward>)
output :  tensor([[170391.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(370044.0938, grad_fn=<MseLossBackward>)
output :  tensor([[138887.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5701126., grad_fn=<MseLossBackward>)
output :  tensor([[126033.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(8797480., grad_fn=<MseLossBackward>)
output :  tensor([[121033.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(2352700.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144895.]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7813e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168892.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1347e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152197.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6237974.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179565.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(188817.4062, grad_fn=<MseLossBackward>)
output :  tensor([[142636.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2679155.2500, grad_fn=<MseLossBackward>)
output :  tensor([[101891.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4141e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136015.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2385e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137223.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4945759., grad_fn=<MseLossBackward>)
output :  tensor([[135178.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(66887352., grad_fn=<MseLossBackward>)
output :  tensor([[227386.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5693443.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132487.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(56257.9102, grad_fn=<MseLossBackward>)
output :  tensor([[147253.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3050862.7500, grad_fn=<MseLossBackward>)
output :  tensor([[109716.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(5216335., grad_fn=<MseLossBackward>)
output :  tensor([[158563.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2064250.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141342.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8791e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194587.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6697663., grad_fn=<MseLossBackward>)
output :  tensor([[134600.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(22598.5449, grad_fn=<MseLossBackward>)
output :  tensor([[111219.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1486646.7500, grad_fn=<MseLossBackward>)
output :  tensor([[232623.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1893548., grad_fn=<MseLossBackward>)
output :  tensor([[165912.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2636e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155162.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(14728925., grad_fn=<MseLossBackward>)
output :  tensor([[204539.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8211e+10, grad_fn=<MseLossBackward>)
output :  tensor([[247229.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1400e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146581.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9493428., grad_fn=<MseLossBackward>)
output :  tensor([[132327.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2795740.7500, grad_fn=<MseLossBackward>)
output :  tensor([[159461.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(19906238., grad_fn=<MseLossBackward>)
output :  tensor([[135446.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(29666574., grad_fn=<MseLossBackward>)
output :  tensor([[180283.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3547e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183881.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(47612.6055, grad_fn=<MseLossBackward>)
output :  tensor([[165739.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(17974686., grad_fn=<MseLossBackward>)
output :  tensor([[136727.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(39343864., grad_fn=<MseLossBackward>)
output :  tensor([[143325.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(682043.6875, grad_fn=<MseLossBackward>)
output :  tensor([[149011.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(16093010., grad_fn=<MseLossBackward>)
output :  tensor([[173116.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4315e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193312.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6111e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139067.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6590612., grad_fn=<MseLossBackward>)
output :  tensor([[171627.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(74120.0625, grad_fn=<MseLossBackward>)
output :  tensor([[175554.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(29656022., grad_fn=<MseLossBackward>)
output :  tensor([[116679.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(2822321.2500, grad_fn=<MseLossBackward>)
output :  tensor([[216531.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(19968888., grad_fn=<MseLossBackward>)
output :  tensor([[187341.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(14757722., grad_fn=<MseLossBackward>)
output :  tensor([[129768.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(18222360., grad_fn=<MseLossBackward>)
output :  tensor([[192078.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(19548556., grad_fn=<MseLossBackward>)
output :  tensor([[177552.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7034927.5000, grad_fn=<MseLossBackward>)
output :  tensor([[209755.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1150e+10, grad_fn=<MseLossBackward>)
output :  tensor([[210113.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(785245.1875, grad_fn=<MseLossBackward>)
output :  tensor([[166843.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2847e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193298.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1443114.1250, grad_fn=<MseLossBackward>)
output :  tensor([[111398.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(2563576.2500, grad_fn=<MseLossBackward>)
output :  tensor([[115893.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(11516903., grad_fn=<MseLossBackward>)
output :  tensor([[112770.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(593670.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145117.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2832278.7500, grad_fn=<MseLossBackward>)
output :  tensor([[160089.]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3326e+10, grad_fn=<MseLossBackward>)
output :  tensor([[181830.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3351702.7500, grad_fn=<MseLossBackward>)
output :  tensor([[127275.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(50424.8086, grad_fn=<MseLossBackward>)
output :  tensor([[146184.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1402522.1250, grad_fn=<MseLossBackward>)
output :  tensor([[182742.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2889e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117838.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(879873.3125, grad_fn=<MseLossBackward>)
output :  tensor([[193366.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(13201187., grad_fn=<MseLossBackward>)
output :  tensor([[146270.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1613813., grad_fn=<MseLossBackward>)
output :  tensor([[213863.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(929265.8750, grad_fn=<MseLossBackward>)
output :  tensor([[126563.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(317884.5312, grad_fn=<MseLossBackward>)
output :  tensor([[248012.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(99668.4609, grad_fn=<MseLossBackward>)
output :  tensor([[240322.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9961e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147615.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6293e+08, grad_fn=<MseLossBackward>)
output :  tensor([[86977.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7484e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194057.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5354e+09, grad_fn=<MseLossBackward>)
output :  tensor([[84101.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(9618188., grad_fn=<MseLossBackward>)
output :  tensor([[141935.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5931356., grad_fn=<MseLossBackward>)
output :  tensor([[77296.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(3228394.7500, grad_fn=<MseLossBackward>)
output :  tensor([[144747.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3221015.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177029.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1059516.3750, grad_fn=<MseLossBackward>)
output :  tensor([[153210.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(84000.3438, grad_fn=<MseLossBackward>)
output :  tensor([[106723.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(457958.8438, grad_fn=<MseLossBackward>)
output :  tensor([[202841.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2748e+10, grad_fn=<MseLossBackward>)
output :  tensor([[126865.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2672407.5000, grad_fn=<MseLossBackward>)
output :  tensor([[269331.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1381e+08, grad_fn=<MseLossBackward>)
output :  tensor([[304912.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(25886154., grad_fn=<MseLossBackward>)
output :  tensor([[110002.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6260786., grad_fn=<MseLossBackward>)
output :  tensor([[171324.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1381763.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133996.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7583e+08, grad_fn=<MseLossBackward>)
output :  tensor([[142479.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(12103767., grad_fn=<MseLossBackward>)
output :  tensor([[133219.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(8817373., grad_fn=<MseLossBackward>)
output :  tensor([[126711.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(2929473., grad_fn=<MseLossBackward>)
output :  tensor([[134009.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0072e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226775.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8504e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190333.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2700e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142249.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2723840.7500, grad_fn=<MseLossBackward>)
output :  tensor([[130394.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(8377090., grad_fn=<MseLossBackward>)
output :  tensor([[110318.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(866906.5000, grad_fn=<MseLossBackward>)
output :  tensor([[256098.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8393e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135974.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(948858.6250, grad_fn=<MseLossBackward>)
output :  tensor([[203214.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(45936.5469, grad_fn=<MseLossBackward>)
output :  tensor([[109131.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(17906320., grad_fn=<MseLossBackward>)
output :  tensor([[140295.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(119089.6953, grad_fn=<MseLossBackward>)
output :  tensor([[207543.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8752e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181734.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3363613.2500, grad_fn=<MseLossBackward>)
output :  tensor([[184329.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(449528.3438, grad_fn=<MseLossBackward>)
output :  tensor([[161983.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1614e+10, grad_fn=<MseLossBackward>)
output :  tensor([[300502.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1901e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197271.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(394756.9688, grad_fn=<MseLossBackward>)
output :  tensor([[258882.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0730e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221803.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9534e+09, grad_fn=<MseLossBackward>)
output :  tensor([[280666.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3202e+09, grad_fn=<MseLossBackward>)
output :  tensor([[225212.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1469701.6250, grad_fn=<MseLossBackward>)
output :  tensor([[224309.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8120e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194823.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4738444.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160088.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6652e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133859.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1849430., grad_fn=<MseLossBackward>)
output :  tensor([[136173.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(453202.4375, grad_fn=<MseLossBackward>)
output :  tensor([[91274.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(75586.3359, grad_fn=<MseLossBackward>)
output :  tensor([[109551.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2406909.7500, grad_fn=<MseLossBackward>)
output :  tensor([[273169.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1059e+09, grad_fn=<MseLossBackward>)
output :  tensor([[231810.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(10172811., grad_fn=<MseLossBackward>)
output :  tensor([[147434.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5927551., grad_fn=<MseLossBackward>)
output :  tensor([[135571.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3717726.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170483.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(10559453., grad_fn=<MseLossBackward>)
output :  tensor([[145191.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3442.3889, grad_fn=<MseLossBackward>)
output :  tensor([[166480.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8509e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165811.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(658633.6875, grad_fn=<MseLossBackward>)
output :  tensor([[141979.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(24796666., grad_fn=<MseLossBackward>)
output :  tensor([[190370.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6064e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115611.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(13039829., grad_fn=<MseLossBackward>)
output :  tensor([[176880.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(23820652., grad_fn=<MseLossBackward>)
output :  tensor([[120984.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(969424.8750, grad_fn=<MseLossBackward>)
output :  tensor([[87776.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(603061.4375, grad_fn=<MseLossBackward>)
output :  tensor([[180135.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(18229.2188, grad_fn=<MseLossBackward>)
output :  tensor([[109370.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(280635.0625, grad_fn=<MseLossBackward>)
output :  tensor([[240906.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3635219., grad_fn=<MseLossBackward>)
output :  tensor([[244445.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(307435.5938, grad_fn=<MseLossBackward>)
output :  tensor([[133823.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(18694274., grad_fn=<MseLossBackward>)
output :  tensor([[109629.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(449790.2812, grad_fn=<MseLossBackward>)
output :  tensor([[289833.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1703e+10, grad_fn=<MseLossBackward>)
output :  tensor([[172910.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1988188.1250, grad_fn=<MseLossBackward>)
output :  tensor([[119453.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(30759242., grad_fn=<MseLossBackward>)
output :  tensor([[144346.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9414e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198956.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2631e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140053.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(895625.6250, grad_fn=<MseLossBackward>)
output :  tensor([[157623.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4976e+10, grad_fn=<MseLossBackward>)
output :  tensor([[154438.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(289763.5312, grad_fn=<MseLossBackward>)
output :  tensor([[128563.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(876929.8125, grad_fn=<MseLossBackward>)
output :  tensor([[248987.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6773e+10, grad_fn=<MseLossBackward>)
output :  tensor([[394551.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(55476428., grad_fn=<MseLossBackward>)
output :  tensor([[110543.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(2383767.2500, grad_fn=<MseLossBackward>)
output :  tensor([[122393.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(15159342., grad_fn=<MseLossBackward>)
output :  tensor([[158335.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1355005.1250, grad_fn=<MseLossBackward>)
output :  tensor([[132172.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7642e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160970.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7246e+09, grad_fn=<MseLossBackward>)
output :  tensor([[170165.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6199e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106601.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(9008815., grad_fn=<MseLossBackward>)
output :  tensor([[139050.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3800123.7500, grad_fn=<MseLossBackward>)
output :  tensor([[367141.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(23275.3164, grad_fn=<MseLossBackward>)
output :  tensor([[206459.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2601e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173069.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5905583.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194375.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(72663640., grad_fn=<MseLossBackward>)
output :  tensor([[140015.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1031970.2500, grad_fn=<MseLossBackward>)
output :  tensor([[194505.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(35.4397, grad_fn=<MseLossBackward>)
output :  tensor([[135872.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0498e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180447.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(305066.3438, grad_fn=<MseLossBackward>)
output :  tensor([[240180.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3311547., grad_fn=<MseLossBackward>)
output :  tensor([[177388.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(11480767., grad_fn=<MseLossBackward>)
output :  tensor([[108636.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(404774.3125, grad_fn=<MseLossBackward>)
output :  tensor([[264870.]], grad_fn=<AddmmBackward>)
loss:  tensor(95481., grad_fn=<MseLossBackward>)
output :  tensor([[248980.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1039571.4375, grad_fn=<MseLossBackward>)
output :  tensor([[117521.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(30009168., grad_fn=<MseLossBackward>)
output :  tensor([[215928.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4894e+09, grad_fn=<MseLossBackward>)
output :  tensor([[304734.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2292e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207828.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(686023.9375, grad_fn=<MseLossBackward>)
output :  tensor([[214137.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5841e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158369.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(220753.1562, grad_fn=<MseLossBackward>)
output :  tensor([[170733.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(552861.9375, grad_fn=<MseLossBackward>)
output :  tensor([[160380.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(11893445., grad_fn=<MseLossBackward>)
output :  tensor([[165769.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(17896734., grad_fn=<MseLossBackward>)
output :  tensor([[236865.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6934e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220848.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(74086904., grad_fn=<MseLossBackward>)
output :  tensor([[161268.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0358e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123921.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(848298.5625, grad_fn=<MseLossBackward>)
output :  tensor([[178092.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1193317.2500, grad_fn=<MseLossBackward>)
output :  tensor([[179189.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5303e+09, grad_fn=<MseLossBackward>)
output :  tensor([[206968.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5212e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134653.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(49145.3477, grad_fn=<MseLossBackward>)
output :  tensor([[148936.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4728e+08, grad_fn=<MseLossBackward>)
output :  tensor([[273470.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(12454723., grad_fn=<MseLossBackward>)
output :  tensor([[90586.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(31211688., grad_fn=<MseLossBackward>)
output :  tensor([[233811.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(7230553., grad_fn=<MseLossBackward>)
output :  tensor([[259612.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0454e+11, grad_fn=<MseLossBackward>)
output :  tensor([[168000.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3998375.2500, grad_fn=<MseLossBackward>)
output :  tensor([[194455.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6438e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154222.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(604069., grad_fn=<MseLossBackward>)
output :  tensor([[205363.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1779e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130708.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(2920120.2500, grad_fn=<MseLossBackward>)
output :  tensor([[152073.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(50040812., grad_fn=<MseLossBackward>)
output :  tensor([[169552.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3184e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186966.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1246188.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128843.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(8083049., grad_fn=<MseLossBackward>)
output :  tensor([[137491.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(982669.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176529.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(12457811., grad_fn=<MseLossBackward>)
output :  tensor([[197177.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7902e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239780.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(10363068., grad_fn=<MseLossBackward>)
output :  tensor([[154004.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(991518.0625, grad_fn=<MseLossBackward>)
output :  tensor([[202382.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(40739496., grad_fn=<MseLossBackward>)
output :  tensor([[160477.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7150e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184483.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(24831690., grad_fn=<MseLossBackward>)
output :  tensor([[184278.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(19173042., grad_fn=<MseLossBackward>)
output :  tensor([[97356.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(127404.3750, grad_fn=<MseLossBackward>)
output :  tensor([[172153.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1631e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135745.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(555234.5625, grad_fn=<MseLossBackward>)
output :  tensor([[120922.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(35073136., grad_fn=<MseLossBackward>)
output :  tensor([[170028.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(15772440., grad_fn=<MseLossBackward>)
output :  tensor([[85080.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(6531.9229, grad_fn=<MseLossBackward>)
output :  tensor([[286963.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(9219763., grad_fn=<MseLossBackward>)
output :  tensor([[167438.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(5947882.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191947.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9943e+10, grad_fn=<MseLossBackward>)
output :  tensor([[245933.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2833e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151802.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(644156.7500, grad_fn=<MseLossBackward>)
output :  tensor([[121099.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(8414079., grad_fn=<MseLossBackward>)
output :  tensor([[124607.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(22164160., grad_fn=<MseLossBackward>)
output :  tensor([[143545.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1485e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172285.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2937956.7500, grad_fn=<MseLossBackward>)
output :  tensor([[112162.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7987e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208760.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1933e+10, grad_fn=<MseLossBackward>)
output :  tensor([[238007.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(12195264., grad_fn=<MseLossBackward>)
output :  tensor([[251067.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0772e+10, grad_fn=<MseLossBackward>)
output :  tensor([[220739.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3343e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194452.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4653e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188101.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(361407.6250, grad_fn=<MseLossBackward>)
output :  tensor([[205708.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8032e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188119.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1869e+10, grad_fn=<MseLossBackward>)
output :  tensor([[175425.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(10988707., grad_fn=<MseLossBackward>)
output :  tensor([[151925.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5596.9102, grad_fn=<MseLossBackward>)
output :  tensor([[335763.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1527927.7500, grad_fn=<MseLossBackward>)
output :  tensor([[210745.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1573652.6250, grad_fn=<MseLossBackward>)
output :  tensor([[162349.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5519269., grad_fn=<MseLossBackward>)
output :  tensor([[186523.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0224e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105315.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(99579.6875, grad_fn=<MseLossBackward>)
output :  tensor([[269644.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1428e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170756.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(9884441., grad_fn=<MseLossBackward>)
output :  tensor([[211911.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2523878.2500, grad_fn=<MseLossBackward>)
output :  tensor([[210773.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0459e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178041.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1341651.6250, grad_fn=<MseLossBackward>)
output :  tensor([[199244.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6530101., grad_fn=<MseLossBackward>)
output :  tensor([[155981.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(962391.6875, grad_fn=<MseLossBackward>)
output :  tensor([[149959.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4960e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119082.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(338915., grad_fn=<MseLossBackward>)
output :  tensor([[141729.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2990143.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144981.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(16148719., grad_fn=<MseLossBackward>)
output :  tensor([[199099.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6615e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159513.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(178.4729, grad_fn=<MseLossBackward>)
output :  tensor([[101464.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(3857510.7500, grad_fn=<MseLossBackward>)
output :  tensor([[224747.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3263e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185714.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0863e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174704.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3171682.7500, grad_fn=<MseLossBackward>)
output :  tensor([[82611.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(373378.2812, grad_fn=<MseLossBackward>)
output :  tensor([[130120.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(2626298.7500, grad_fn=<MseLossBackward>)
output :  tensor([[211338.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7082833.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141883.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4479440., grad_fn=<MseLossBackward>)
output :  tensor([[130705.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(497443.6875, grad_fn=<MseLossBackward>)
output :  tensor([[147098.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(20233128., grad_fn=<MseLossBackward>)
output :  tensor([[176528.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5232e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146519.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6350321.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160268.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(72008.3672, grad_fn=<MseLossBackward>)
output :  tensor([[213272.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2984742.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134676.]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8066e+08, grad_fn=<MseLossBackward>)
output :  tensor([[252349.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7026227., grad_fn=<MseLossBackward>)
output :  tensor([[158553.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(896453.9375, grad_fn=<MseLossBackward>)
output :  tensor([[128847.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(120669.3906, grad_fn=<MseLossBackward>)
output :  tensor([[95419.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(176098.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153041.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6980e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178490.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1987879.7500, grad_fn=<MseLossBackward>)
output :  tensor([[119643.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(734194.6250, grad_fn=<MseLossBackward>)
output :  tensor([[187743.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6979e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143492.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0950e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150947.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1098173., grad_fn=<MseLossBackward>)
output :  tensor([[186566.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1401449., grad_fn=<MseLossBackward>)
output :  tensor([[253674.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5525e+09, grad_fn=<MseLossBackward>)
output :  tensor([[92083.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(339916.3438, grad_fn=<MseLossBackward>)
output :  tensor([[239985.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(209.3447, grad_fn=<MseLossBackward>)
output :  tensor([[127966.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(284563.9062, grad_fn=<MseLossBackward>)
output :  tensor([[164331.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0316e+10, grad_fn=<MseLossBackward>)
output :  tensor([[112182.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4842e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176098.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(9674.5664, grad_fn=<MseLossBackward>)
output :  tensor([[163417.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7685e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154948.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9774e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237668.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1773058.7500, grad_fn=<MseLossBackward>)
output :  tensor([[223262.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2067e+09, grad_fn=<MseLossBackward>)
output :  tensor([[126438.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(315361.2188, grad_fn=<MseLossBackward>)
output :  tensor([[131868.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(34439660., grad_fn=<MseLossBackward>)
output :  tensor([[225393.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2579587.2500, grad_fn=<MseLossBackward>)
output :  tensor([[230341.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(13382336., grad_fn=<MseLossBackward>)
output :  tensor([[225361.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1791665.8750, grad_fn=<MseLossBackward>)
output :  tensor([[150502.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6262584.5000, grad_fn=<MseLossBackward>)
output :  tensor([[211275.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1626820.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131742.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3790e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135806.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(10931909., grad_fn=<MseLossBackward>)
output :  tensor([[311459.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(12535583., grad_fn=<MseLossBackward>)
output :  tensor([[139155.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3400681.7500, grad_fn=<MseLossBackward>)
output :  tensor([[120678.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8814e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108920.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(335268.1562, grad_fn=<MseLossBackward>)
output :  tensor([[155524.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8816e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178552.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2491e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172399.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(360975.6562, grad_fn=<MseLossBackward>)
output :  tensor([[192163.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(78090632., grad_fn=<MseLossBackward>)
output :  tensor([[103119.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(9729964., grad_fn=<MseLossBackward>)
output :  tensor([[180023.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1048480., grad_fn=<MseLossBackward>)
output :  tensor([[172429.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(20513964., grad_fn=<MseLossBackward>)
output :  tensor([[137901.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1206565., grad_fn=<MseLossBackward>)
output :  tensor([[261674.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4917e+09, grad_fn=<MseLossBackward>)
output :  tensor([[140617.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0933e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175441.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5961609., grad_fn=<MseLossBackward>)
output :  tensor([[139371.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(395228.3125, grad_fn=<MseLossBackward>)
output :  tensor([[197261.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(10487477., grad_fn=<MseLossBackward>)
output :  tensor([[170415.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(173030., grad_fn=<MseLossBackward>)
output :  tensor([[242847.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1328328.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132985.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2295177.7500, grad_fn=<MseLossBackward>)
output :  tensor([[150552.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1445517.7500, grad_fn=<MseLossBackward>)
output :  tensor([[212420.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6655594., grad_fn=<MseLossBackward>)
output :  tensor([[162351.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7013145.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194458.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(29792322., grad_fn=<MseLossBackward>)
output :  tensor([[132417.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0665e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128970.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(842.3599, grad_fn=<MseLossBackward>)
output :  tensor([[138531.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2155666.2500, grad_fn=<MseLossBackward>)
output :  tensor([[200605.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7465e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166119.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6132e+09, grad_fn=<MseLossBackward>)
output :  tensor([[73138.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7263e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91365.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(47137236., grad_fn=<MseLossBackward>)
output :  tensor([[249758.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(12495341., grad_fn=<MseLossBackward>)
output :  tensor([[204281.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2617e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113990.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(1018948.3125, grad_fn=<MseLossBackward>)
output :  tensor([[157507.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9957e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208034.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4318e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180954.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9291e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158482.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(12128350., grad_fn=<MseLossBackward>)
output :  tensor([[169656.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(117702.6016, grad_fn=<MseLossBackward>)
output :  tensor([[115830.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(690444.1250, grad_fn=<MseLossBackward>)
output :  tensor([[160693.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(32418078., grad_fn=<MseLossBackward>)
output :  tensor([[192763.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9985e+08, grad_fn=<MseLossBackward>)
output :  tensor([[218918.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(338305.8125, grad_fn=<MseLossBackward>)
output :  tensor([[247630.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4738e+11, grad_fn=<MseLossBackward>)
output :  tensor([[143404.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(12924250., grad_fn=<MseLossBackward>)
output :  tensor([[110530.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4204358., grad_fn=<MseLossBackward>)
output :  tensor([[169708.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4864e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148748.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3066986., grad_fn=<MseLossBackward>)
output :  tensor([[235149.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3424292.5000, grad_fn=<MseLossBackward>)
output :  tensor([[113110.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3571509.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177799.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(26014782., grad_fn=<MseLossBackward>)
output :  tensor([[187876.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1383894.8750, grad_fn=<MseLossBackward>)
output :  tensor([[163488.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4496e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97105.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5938e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239013.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(173.9102, grad_fn=<MseLossBackward>)
output :  tensor([[177546.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2390309.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140359.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(129318.9062, grad_fn=<MseLossBackward>)
output :  tensor([[234375.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(390136.8750, grad_fn=<MseLossBackward>)
output :  tensor([[163667.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(445326.8125, grad_fn=<MseLossBackward>)
output :  tensor([[204737.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4463e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135643.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(414655.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186736.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1189e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133867.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4547689.5000, grad_fn=<MseLossBackward>)
output :  tensor([[227032.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(80416336., grad_fn=<MseLossBackward>)
output :  tensor([[224602.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4501e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91501.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2254502.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158623.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(656150.6250, grad_fn=<MseLossBackward>)
output :  tensor([[248235.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5041e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144291.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(501551.6562, grad_fn=<MseLossBackward>)
output :  tensor([[110853.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9231e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162971.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2337220., grad_fn=<MseLossBackward>)
output :  tensor([[145794.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3221071.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126879.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1742853.7500, grad_fn=<MseLossBackward>)
output :  tensor([[188856.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9201e+09, grad_fn=<MseLossBackward>)
output :  tensor([[122023.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(227171.3906, grad_fn=<MseLossBackward>)
output :  tensor([[156765.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(22713714., grad_fn=<MseLossBackward>)
output :  tensor([[170402.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1815798.3750, grad_fn=<MseLossBackward>)
output :  tensor([[147028.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(15769089., grad_fn=<MseLossBackward>)
output :  tensor([[162244.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(429168.2812, grad_fn=<MseLossBackward>)
output :  tensor([[134091.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2956e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132255.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(65440.0352, grad_fn=<MseLossBackward>)
output :  tensor([[154748.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4802e+08, grad_fn=<MseLossBackward>)
output :  tensor([[143910.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(58096.0625, grad_fn=<MseLossBackward>)
output :  tensor([[162963.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1473492.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138878.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3973e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147012.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3196888.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188965.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(931405.9375, grad_fn=<MseLossBackward>)
output :  tensor([[171387.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5699186.5000, grad_fn=<MseLossBackward>)
output :  tensor([[181364.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1860623.8750, grad_fn=<MseLossBackward>)
output :  tensor([[220967.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(936872.7500, grad_fn=<MseLossBackward>)
output :  tensor([[111841.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(15536100., grad_fn=<MseLossBackward>)
output :  tensor([[136961.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4549e+08, grad_fn=<MseLossBackward>)
output :  tensor([[286179.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(32186.6016, grad_fn=<MseLossBackward>)
output :  tensor([[118280.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5201749.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179138.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6697e+09, grad_fn=<MseLossBackward>)
output :  tensor([[187422.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5868885., grad_fn=<MseLossBackward>)
output :  tensor([[195065.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(91496400., grad_fn=<MseLossBackward>)
output :  tensor([[251300.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6169e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226495.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(20208536., grad_fn=<MseLossBackward>)
output :  tensor([[127901.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8405e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176047.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3118e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123844.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(24189.9688, grad_fn=<MseLossBackward>)
output :  tensor([[184581.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4617e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153483.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(233908.2500, grad_fn=<MseLossBackward>)
output :  tensor([[154204.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(59362452., grad_fn=<MseLossBackward>)
output :  tensor([[205972.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(107266.4844, grad_fn=<MseLossBackward>)
output :  tensor([[147331.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1998e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174333.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2776961.7500, grad_fn=<MseLossBackward>)
output :  tensor([[252439.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3228e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147619.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(144495.0156, grad_fn=<MseLossBackward>)
output :  tensor([[200864.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3241012.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163107.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(9971681., grad_fn=<MseLossBackward>)
output :  tensor([[121477.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1207e+09, grad_fn=<MseLossBackward>)
output :  tensor([[132513.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(10475337., grad_fn=<MseLossBackward>)
output :  tensor([[181508.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6207650., grad_fn=<MseLossBackward>)
output :  tensor([[195456.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(29771688., grad_fn=<MseLossBackward>)
output :  tensor([[231608.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2937e+09, grad_fn=<MseLossBackward>)
output :  tensor([[252783.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(17779662., grad_fn=<MseLossBackward>)
output :  tensor([[188220.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7103e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144587.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8183e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145333.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(695321.4375, grad_fn=<MseLossBackward>)
output :  tensor([[70742.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4512e+08, grad_fn=<MseLossBackward>)
output :  tensor([[143755.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(76663432., grad_fn=<MseLossBackward>)
output :  tensor([[131550.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(7026144., grad_fn=<MseLossBackward>)
output :  tensor([[155272.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1619335.7500, grad_fn=<MseLossBackward>)
output :  tensor([[130318.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(11014724., grad_fn=<MseLossBackward>)
output :  tensor([[75089.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(1988915.2500, grad_fn=<MseLossBackward>)
output :  tensor([[84449.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(6000662.5000, grad_fn=<MseLossBackward>)
output :  tensor([[244116.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4680e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140555.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8709e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134030.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(12464872., grad_fn=<MseLossBackward>)
output :  tensor([[172338.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(28495912., grad_fn=<MseLossBackward>)
output :  tensor([[231675.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(11055209., grad_fn=<MseLossBackward>)
output :  tensor([[190001.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4571912.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158607.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6800360., grad_fn=<MseLossBackward>)
output :  tensor([[195716.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4769515., grad_fn=<MseLossBackward>)
output :  tensor([[203367.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1311e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135161.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3380599.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156298.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1685412.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137593.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2538893.7500, grad_fn=<MseLossBackward>)
output :  tensor([[198111.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0169e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152449.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2405261.7500, grad_fn=<MseLossBackward>)
output :  tensor([[140034.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1655e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146235.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1784186.3750, grad_fn=<MseLossBackward>)
output :  tensor([[209479.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6351109., grad_fn=<MseLossBackward>)
output :  tensor([[101831.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9327e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169498.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3994002.2500, grad_fn=<MseLossBackward>)
output :  tensor([[126695.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1701964.8750, grad_fn=<MseLossBackward>)
output :  tensor([[145396.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2572014., grad_fn=<MseLossBackward>)
output :  tensor([[106738.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9674e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141148.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(13309272., grad_fn=<MseLossBackward>)
output :  tensor([[237717.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2950343., grad_fn=<MseLossBackward>)
output :  tensor([[143880.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1253035.3750, grad_fn=<MseLossBackward>)
output :  tensor([[139051.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2407782.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164190.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3098e+09, grad_fn=<MseLossBackward>)
output :  tensor([[271761.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(38924340., grad_fn=<MseLossBackward>)
output :  tensor([[176391.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1937620.5000, grad_fn=<MseLossBackward>)
output :  tensor([[105938.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(10003581., grad_fn=<MseLossBackward>)
output :  tensor([[202091.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6865e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156862.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4567570.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163027.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5967e+10, grad_fn=<MseLossBackward>)
output :  tensor([[101159.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(8175891.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124893.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(1672677.3750, grad_fn=<MseLossBackward>)
output :  tensor([[158470.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(6104991.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141135.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1290105.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200990.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(981121.1875, grad_fn=<MseLossBackward>)
output :  tensor([[142491.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(241664.4219, grad_fn=<MseLossBackward>)
output :  tensor([[266386.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(16860776., grad_fn=<MseLossBackward>)
output :  tensor([[128631.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2696e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165750.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(62617.2422, grad_fn=<MseLossBackward>)
output :  tensor([[188607.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(11620.1660, grad_fn=<MseLossBackward>)
output :  tensor([[123937.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9424e+08, grad_fn=<MseLossBackward>)
output :  tensor([[247833.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4692503.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158886.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9038e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243798.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2405649.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144578.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(335005.8125, grad_fn=<MseLossBackward>)
output :  tensor([[212308.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5330110., grad_fn=<MseLossBackward>)
output :  tensor([[176769.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(19089526., grad_fn=<MseLossBackward>)
output :  tensor([[152824.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1382351.3750, grad_fn=<MseLossBackward>)
output :  tensor([[118932.]], grad_fn=<AddmmBackward>)
loss:  tensor(868624., grad_fn=<MseLossBackward>)
output :  tensor([[239029.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3098e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239601.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(159138.6562, grad_fn=<MseLossBackward>)
output :  tensor([[151044.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5254410., grad_fn=<MseLossBackward>)
output :  tensor([[255451.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(304548.7812, grad_fn=<MseLossBackward>)
output :  tensor([[124267.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(95325168., grad_fn=<MseLossBackward>)
output :  tensor([[176536.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(287815.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159758.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(58178.9492, grad_fn=<MseLossBackward>)
output :  tensor([[128874.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(4519178.5000, grad_fn=<MseLossBackward>)
output :  tensor([[193923.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1504e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163639.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(129780.0625, grad_fn=<MseLossBackward>)
output :  tensor([[167374.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(19137618., grad_fn=<MseLossBackward>)
output :  tensor([[156225.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3147131.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151362.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2138997.7500, grad_fn=<MseLossBackward>)
output :  tensor([[171852.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8879e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159347.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(425246.6250, grad_fn=<MseLossBackward>)
output :  tensor([[377846.]], grad_fn=<AddmmBackward>)
loss:  tensor(37503376., grad_fn=<MseLossBackward>)
output :  tensor([[122531.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(19968818., grad_fn=<MseLossBackward>)
output :  tensor([[129772.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9601e+09, grad_fn=<MseLossBackward>)
output :  tensor([[275931.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(27897874., grad_fn=<MseLossBackward>)
output :  tensor([[161181.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(670070.1250, grad_fn=<MseLossBackward>)
output :  tensor([[129825.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(86962912., grad_fn=<MseLossBackward>)
output :  tensor([[235033.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(9204966., grad_fn=<MseLossBackward>)
output :  tensor([[178225.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5171431.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154454.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6023880., grad_fn=<MseLossBackward>)
output :  tensor([[145900.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(811603.9375, grad_fn=<MseLossBackward>)
output :  tensor([[155802.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5731e+08, grad_fn=<MseLossBackward>)
output :  tensor([[100447.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(200424.0938, grad_fn=<MseLossBackward>)
output :  tensor([[75065.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2698e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163754.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1551815.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188150.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5880e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157480.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(269474.5312, grad_fn=<MseLossBackward>)
output :  tensor([[160566.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(9403326., grad_fn=<MseLossBackward>)
output :  tensor([[139744.]], grad_fn=<AddmmBackward>)
loss:  tensor(5262436., grad_fn=<MseLossBackward>)
output :  tensor([[209044.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(9575157., grad_fn=<MseLossBackward>)
output :  tensor([[140134.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4556090., grad_fn=<MseLossBackward>)
output :  tensor([[181817.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6431e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142890.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(9670254., grad_fn=<MseLossBackward>)
output :  tensor([[110612.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6246e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92572.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(2036975.6250, grad_fn=<MseLossBackward>)
output :  tensor([[174423.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(332604.5312, grad_fn=<MseLossBackward>)
output :  tensor([[254742.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(32010136., grad_fn=<MseLossBackward>)
output :  tensor([[142238.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(545128.4375, grad_fn=<MseLossBackward>)
output :  tensor([[156168.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(13889830., grad_fn=<MseLossBackward>)
output :  tensor([[132751.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(63260.1094, grad_fn=<MseLossBackward>)
output :  tensor([[148947.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(305239., grad_fn=<MseLossBackward>)
output :  tensor([[168596.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(485003.4375, grad_fn=<MseLossBackward>)
output :  tensor([[126557.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(195433.0625, grad_fn=<MseLossBackward>)
output :  tensor([[173441.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0889e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157757.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(574540.3125, grad_fn=<MseLossBackward>)
output :  tensor([[117670.]], grad_fn=<AddmmBackward>)
loss:  tensor(1368900., grad_fn=<MseLossBackward>)
output :  tensor([[159541.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3961e+09, grad_fn=<MseLossBackward>)
output :  tensor([[52750.5820]], grad_fn=<AddmmBackward>)
loss:  tensor(563373.3750, grad_fn=<MseLossBackward>)
output :  tensor([[235168.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9802e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197732.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(10679211., grad_fn=<MseLossBackward>)
output :  tensor([[183768.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1516823.1250, grad_fn=<MseLossBackward>)
output :  tensor([[108005.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(4020244.2500, grad_fn=<MseLossBackward>)
output :  tensor([[88710.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2925436., grad_fn=<MseLossBackward>)
output :  tensor([[135550.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(19797076., grad_fn=<MseLossBackward>)
output :  tensor([[222820.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0665e+09, grad_fn=<MseLossBackward>)
output :  tensor([[204605.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(8380572.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164394.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(366743.7812, grad_fn=<MseLossBackward>)
output :  tensor([[173145.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4373e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191318.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1739637.3750, grad_fn=<MseLossBackward>)
output :  tensor([[90915.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(15331140., grad_fn=<MseLossBackward>)
output :  tensor([[140643.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(414373.8438, grad_fn=<MseLossBackward>)
output :  tensor([[111853.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1831623.8750, grad_fn=<MseLossBackward>)
output :  tensor([[144759.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(77432576., grad_fn=<MseLossBackward>)
output :  tensor([[171846.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6685e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195257.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(94915696., grad_fn=<MseLossBackward>)
output :  tensor([[180652.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(425307.7812, grad_fn=<MseLossBackward>)
output :  tensor([[96509.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(88.7717, grad_fn=<MseLossBackward>)
output :  tensor([[117460.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(1539.9492, grad_fn=<MseLossBackward>)
output :  tensor([[160718.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4204e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199441.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(311608.1875, grad_fn=<MseLossBackward>)
output :  tensor([[143589.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(168779.7500, grad_fn=<MseLossBackward>)
train_loss: [2.5974433e+09]
epoch_result tensor([0.])
output :  tensor([[158310.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(35774.1758, grad_fn=<MseLossBackward>)
output :  tensor([[121114.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(784027.2500, grad_fn=<MseLossBackward>)
output :  tensor([[197458.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(10611204., grad_fn=<MseLossBackward>)
output :  tensor([[179660.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7080671.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154259.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6359e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128816.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(666672.2500, grad_fn=<MseLossBackward>)
output :  tensor([[141039.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1567.6650, grad_fn=<MseLossBackward>)
output :  tensor([[118462.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(289074.2500, grad_fn=<MseLossBackward>)
output :  tensor([[65928.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(55179132., grad_fn=<MseLossBackward>)
output :  tensor([[165559.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(194095.3125, grad_fn=<MseLossBackward>)
output :  tensor([[148515.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(72512408., grad_fn=<MseLossBackward>)
output :  tensor([[223989.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1021552.3750, grad_fn=<MseLossBackward>)
output :  tensor([[168083.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(839113.2500, grad_fn=<MseLossBackward>)
output :  tensor([[246260.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(11830698., grad_fn=<MseLossBackward>)
output :  tensor([[54315.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(468754.1875, grad_fn=<MseLossBackward>)
output :  tensor([[161329.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8322e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175671.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(450366.8125, grad_fn=<MseLossBackward>)
output :  tensor([[172515.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5649e+08, grad_fn=<MseLossBackward>)
output :  tensor([[276520.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2311445., grad_fn=<MseLossBackward>)
output :  tensor([[195486.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2290351.2500, grad_fn=<MseLossBackward>)
output :  tensor([[135097.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6952e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195255.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1895741.7500, grad_fn=<MseLossBackward>)
output :  tensor([[178873.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1185e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152588.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2523431.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169706.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(86362.5156, grad_fn=<MseLossBackward>)
output :  tensor([[85289.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(12141.2852, grad_fn=<MseLossBackward>)
output :  tensor([[171520.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4247e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185425.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(180983.7656, grad_fn=<MseLossBackward>)
output :  tensor([[204853.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5651e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108924.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1156599.3750, grad_fn=<MseLossBackward>)
output :  tensor([[171616.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(379590.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138102.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2569208.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128817.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(33320.5078, grad_fn=<MseLossBackward>)
output :  tensor([[119872.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(138494.4531, grad_fn=<MseLossBackward>)
output :  tensor([[146022.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4231e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168995.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1317e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151739.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4158795.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183105.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9644421., grad_fn=<MseLossBackward>)
output :  tensor([[144325.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(11059470., grad_fn=<MseLossBackward>)
output :  tensor([[104563.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1211e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137706.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9742e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134631.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(136011.1406, grad_fn=<MseLossBackward>)
output :  tensor([[137634.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1308e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225140.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(19604.3750, grad_fn=<MseLossBackward>)
output :  tensor([[133669.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2014093.1250, grad_fn=<MseLossBackward>)
output :  tensor([[148453.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(298662.2500, grad_fn=<MseLossBackward>)
output :  tensor([[113893.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(3585549.2500, grad_fn=<MseLossBackward>)
output :  tensor([[160858.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(736754., grad_fn=<MseLossBackward>)
output :  tensor([[143469.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6554e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193839.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3384622.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133479.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(941172.8125, grad_fn=<MseLossBackward>)
output :  tensor([[106706.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(10844827., grad_fn=<MseLossBackward>)
output :  tensor([[229093.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(24075276., grad_fn=<MseLossBackward>)
output :  tensor([[166524.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2058e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161916.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8508524., grad_fn=<MseLossBackward>)
output :  tensor([[202923.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8756e+10, grad_fn=<MseLossBackward>)
output :  tensor([[246742.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1504e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144797.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1684033.3750, grad_fn=<MseLossBackward>)
output :  tensor([[140500.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(42261376., grad_fn=<MseLossBackward>)
output :  tensor([[156067.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1139856.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133227.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(10417765., grad_fn=<MseLossBackward>)
output :  tensor([[183285.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8851e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181531.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6595025.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161078.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(177464.7344, grad_fn=<MseLossBackward>)
output :  tensor([[149147.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(37795216., grad_fn=<MseLossBackward>)
output :  tensor([[143217.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(515299.6562, grad_fn=<MseLossBackward>)
output :  tensor([[144454.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(297485.0312, grad_fn=<MseLossBackward>)
output :  tensor([[174897.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1975e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193748.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4065e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138892.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5726150., grad_fn=<MseLossBackward>)
output :  tensor([[169284.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6840431.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180056.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(890900., grad_fn=<MseLossBackward>)
output :  tensor([[118177.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(10093627., grad_fn=<MseLossBackward>)
output :  tensor([[222449.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2102454.7500, grad_fn=<MseLossBackward>)
output :  tensor([[181800.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2888087.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128113.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6827932.5000, grad_fn=<MseLossBackward>)
output :  tensor([[196670.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(29198.2656, grad_fn=<MseLossBackward>)
output :  tensor([[174530.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(136287.8750, grad_fn=<MseLossBackward>)
output :  tensor([[211534.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0525e+10, grad_fn=<MseLossBackward>)
output :  tensor([[208227.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7684157.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167316.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3189e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192840.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2754822., grad_fn=<MseLossBackward>)
output :  tensor([[111804.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1428809.3750, grad_fn=<MseLossBackward>)
output :  tensor([[114982.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(6163621., grad_fn=<MseLossBackward>)
output :  tensor([[110844.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1334927.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147969.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1367876.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161231.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2910e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179344.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(429905.5938, grad_fn=<MseLossBackward>)
output :  tensor([[127413.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(7480.8984, grad_fn=<MseLossBackward>)
output :  tensor([[143712.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1658863.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183248.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3375e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119481.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(6662004.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200341.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(11164578., grad_fn=<MseLossBackward>)
output :  tensor([[144831.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(28466.0156, grad_fn=<MseLossBackward>)
output :  tensor([[207561.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(28496746., grad_fn=<MseLossBackward>)
output :  tensor([[128186.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4781260.5000, grad_fn=<MseLossBackward>)
output :  tensor([[246071.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5091369., grad_fn=<MseLossBackward>)
output :  tensor([[238417.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1699e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147432.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5703e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85312.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9110e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194603.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4476e+09, grad_fn=<MseLossBackward>)
output :  tensor([[81640.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(410400.3750, grad_fn=<MseLossBackward>)
output :  tensor([[139357.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(20399.8730, grad_fn=<MseLossBackward>)
output :  tensor([[77091.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(2532300.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142140.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(660435.5625, grad_fn=<MseLossBackward>)
output :  tensor([[175941.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3446.0569, grad_fn=<MseLossBackward>)
output :  tensor([[153847.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(120973.5312, grad_fn=<MseLossBackward>)
output :  tensor([[115194.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(60757152., grad_fn=<MseLossBackward>)
output :  tensor([[203903.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2510e+10, grad_fn=<MseLossBackward>)
output :  tensor([[129408.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(824960.6250, grad_fn=<MseLossBackward>)
output :  tensor([[269372.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1295e+08, grad_fn=<MseLossBackward>)
output :  tensor([[303856.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(37739520., grad_fn=<MseLossBackward>)
output :  tensor([[108948.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2099420., grad_fn=<MseLossBackward>)
output :  tensor([[168555.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(15560190., grad_fn=<MseLossBackward>)
output :  tensor([[134462.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0025e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134931.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(16549260., grad_fn=<MseLossBackward>)
output :  tensor([[131725.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2177699.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128751.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(14076390., grad_fn=<MseLossBackward>)
output :  tensor([[133552.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7853e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226823.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8485e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189488.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2956e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143025.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(765023.5625, grad_fn=<MseLossBackward>)
output :  tensor([[126354.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(1311651.2500, grad_fn=<MseLossBackward>)
output :  tensor([[114658.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(11616967., grad_fn=<MseLossBackward>)
output :  tensor([[257862.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6239e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134518.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(232143.2812, grad_fn=<MseLossBackward>)
output :  tensor([[200505.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6224869., grad_fn=<MseLossBackward>)
output :  tensor([[102606.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5258565.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137199.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7562672., grad_fn=<MseLossBackward>)
output :  tensor([[210192.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0472e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182205.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5314249.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186377.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1896559.3750, grad_fn=<MseLossBackward>)
output :  tensor([[164861.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0776e+10, grad_fn=<MseLossBackward>)
output :  tensor([[299459.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2631e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201141.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(10505398., grad_fn=<MseLossBackward>)
output :  tensor([[263177.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9511e+10, grad_fn=<MseLossBackward>)
output :  tensor([[224158.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7507e+09, grad_fn=<MseLossBackward>)
output :  tensor([[284726.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0416e+09, grad_fn=<MseLossBackward>)
output :  tensor([[221460.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6447790.5000, grad_fn=<MseLossBackward>)
output :  tensor([[223464.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8404e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196908.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8423.7979, grad_fn=<MseLossBackward>)
output :  tensor([[160078.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6588e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135569.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(9420008., grad_fn=<MseLossBackward>)
output :  tensor([[136197.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(486615.2500, grad_fn=<MseLossBackward>)
output :  tensor([[91721.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(520404.4375, grad_fn=<MseLossBackward>)
output :  tensor([[106753.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(1554521.8750, grad_fn=<MseLossBackward>)
output :  tensor([[274373.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9731e+09, grad_fn=<MseLossBackward>)
output :  tensor([[235470.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(221826.2812, grad_fn=<MseLossBackward>)
output :  tensor([[146570.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2467992., grad_fn=<MseLossBackward>)
output :  tensor([[138458.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(919021.8125, grad_fn=<MseLossBackward>)
output :  tensor([[175724.]], grad_fn=<AddmmBackward>)
loss:  tensor(3964081., grad_fn=<MseLossBackward>)
output :  tensor([[146335.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1177767.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164126.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2258e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166939.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3760872.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138037.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1076373.8750, grad_fn=<MseLossBackward>)
output :  tensor([[189631.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5067e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114591.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(6716155.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171537.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(214152.0312, grad_fn=<MseLossBackward>)
output :  tensor([[120016.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(277.4307, grad_fn=<MseLossBackward>)
output :  tensor([[84825.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4728450., grad_fn=<MseLossBackward>)
output :  tensor([[180584.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(341402.8438, grad_fn=<MseLossBackward>)
output :  tensor([[114218.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(18646540., grad_fn=<MseLossBackward>)
output :  tensor([[242924.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(15400964., grad_fn=<MseLossBackward>)
output :  tensor([[249128.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(17048382., grad_fn=<MseLossBackward>)
output :  tensor([[128331.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1365684.3750, grad_fn=<MseLossBackward>)
output :  tensor([[111742.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(7749568.5000, grad_fn=<MseLossBackward>)
output :  tensor([[288374.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2135e+10, grad_fn=<MseLossBackward>)
output :  tensor([[176001.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(20262096., grad_fn=<MseLossBackward>)
output :  tensor([[123982.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1035179.0625, grad_fn=<MseLossBackward>)
output :  tensor([[143212.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3566e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199752.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0300e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139708.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1669183.2500, grad_fn=<MseLossBackward>)
output :  tensor([[157966.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4892e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153370.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(279907.1250, grad_fn=<MseLossBackward>)
output :  tensor([[129922.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(178196.1094, grad_fn=<MseLossBackward>)
output :  tensor([[250633.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6350e+10, grad_fn=<MseLossBackward>)
output :  tensor([[400412.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2520454., grad_fn=<MseLossBackward>)
output :  tensor([[106388.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(6819238.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109639.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(78509568., grad_fn=<MseLossBackward>)
output :  tensor([[159759.]], grad_fn=<AddmmBackward>)
loss:  tensor(67081., grad_fn=<MseLossBackward>)
output :  tensor([[130308.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6129e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162794.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5053e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173829.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0742e+09, grad_fn=<MseLossBackward>)
output :  tensor([[104903.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1698175.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139264.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3011960.2500, grad_fn=<MseLossBackward>)
output :  tensor([[369032.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3023686.2500, grad_fn=<MseLossBackward>)
output :  tensor([[205939.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3098e+09, grad_fn=<MseLossBackward>)
output :  tensor([[177723.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4944160.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198681.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(17792446., grad_fn=<MseLossBackward>)
output :  tensor([[137589.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1988408.5000, grad_fn=<MseLossBackward>)
output :  tensor([[195289.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(623877.8125, grad_fn=<MseLossBackward>)
output :  tensor([[133942.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9918e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185317.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(18638378., grad_fn=<MseLossBackward>)
output :  tensor([[237878.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(16984830., grad_fn=<MseLossBackward>)
output :  tensor([[174760.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(577980.0625, grad_fn=<MseLossBackward>)
output :  tensor([[106504.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(2235702.5000, grad_fn=<MseLossBackward>)
output :  tensor([[265647.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1181161.3750, grad_fn=<MseLossBackward>)
output :  tensor([[252800.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7844813., grad_fn=<MseLossBackward>)
output :  tensor([[123420.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(176505.0156, grad_fn=<MseLossBackward>)
output :  tensor([[217568.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2983e+09, grad_fn=<MseLossBackward>)
output :  tensor([[304871.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1733e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207328.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(107789.0938, grad_fn=<MseLossBackward>)
output :  tensor([[211276.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6570e+10, grad_fn=<MseLossBackward>)
output :  tensor([[156622.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1632645., grad_fn=<MseLossBackward>)
output :  tensor([[165709.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(18322146., grad_fn=<MseLossBackward>)
output :  tensor([[159124.]], grad_fn=<AddmmBackward>)
loss:  tensor(4804864., grad_fn=<MseLossBackward>)
output :  tensor([[166381.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(13094899., grad_fn=<MseLossBackward>)
output :  tensor([[235478.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0576e+09, grad_fn=<MseLossBackward>)
output :  tensor([[220130.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(86955920., grad_fn=<MseLossBackward>)
output :  tensor([[160477.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8165e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122274.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(526202.8750, grad_fn=<MseLossBackward>)
output :  tensor([[176138.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(741778.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180967.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2461e+09, grad_fn=<MseLossBackward>)
output :  tensor([[207130.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5151e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135157.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(525851.5625, grad_fn=<MseLossBackward>)
output :  tensor([[146962.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4328e+08, grad_fn=<MseLossBackward>)
output :  tensor([[275345.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2736129.5000, grad_fn=<MseLossBackward>)
output :  tensor([[89272.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(18256592., grad_fn=<MseLossBackward>)
output :  tensor([[236766.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(70772.6250, grad_fn=<MseLossBackward>)
output :  tensor([[257558.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0587e+11, grad_fn=<MseLossBackward>)
output :  tensor([[168148.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3428225.7500, grad_fn=<MseLossBackward>)
output :  tensor([[194380.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6500e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153138.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3465415., grad_fn=<MseLossBackward>)
output :  tensor([[206349.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0514e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129976.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(954406.8750, grad_fn=<MseLossBackward>)
output :  tensor([[148880.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(15056461., grad_fn=<MseLossBackward>)
output :  tensor([[169087.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0692e+08, grad_fn=<MseLossBackward>)
output :  tensor([[189306.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(11949769., grad_fn=<MseLossBackward>)
output :  tensor([[126533.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(284480.5625, grad_fn=<MseLossBackward>)
output :  tensor([[137584.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1176275.8750, grad_fn=<MseLossBackward>)
output :  tensor([[175498.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6243205., grad_fn=<MseLossBackward>)
output :  tensor([[196673.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8437e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239827.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(10063368., grad_fn=<MseLossBackward>)
output :  tensor([[153006.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3972734., grad_fn=<MseLossBackward>)
output :  tensor([[196844.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(712415.1250, grad_fn=<MseLossBackward>)
output :  tensor([[159787.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4925e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181347.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3413718.2500, grad_fn=<MseLossBackward>)
output :  tensor([[178788.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1235189.1250, grad_fn=<MseLossBackward>)
output :  tensor([[99268.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5144958., grad_fn=<MseLossBackward>)
output :  tensor([[172172.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1627e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133453.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2393015.7500, grad_fn=<MseLossBackward>)
output :  tensor([[120737.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(32914514., grad_fn=<MseLossBackward>)
output :  tensor([[170357.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(13268945., grad_fn=<MseLossBackward>)
output :  tensor([[86561.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2439600., grad_fn=<MseLossBackward>)
output :  tensor([[286352.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(13304256., grad_fn=<MseLossBackward>)
output :  tensor([[167199.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4837937.5000, grad_fn=<MseLossBackward>)
output :  tensor([[192681.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9736e+10, grad_fn=<MseLossBackward>)
output :  tensor([[246312.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0949e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150360.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(409420.0312, grad_fn=<MseLossBackward>)
output :  tensor([[123086.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(834482.2500, grad_fn=<MseLossBackward>)
output :  tensor([[121084.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(1403243.8750, grad_fn=<MseLossBackward>)
output :  tensor([[145207.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1250e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173369.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(397569.6562, grad_fn=<MseLossBackward>)
output :  tensor([[111138.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2016e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209617.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1747e+10, grad_fn=<MseLossBackward>)
output :  tensor([[241397.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(10541.5137, grad_fn=<MseLossBackward>)
output :  tensor([[250421.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0958e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221394.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0996e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197860.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3839e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191291.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(14376302., grad_fn=<MseLossBackward>)
output :  tensor([[207158.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7399e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189570.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1442e+10, grad_fn=<MseLossBackward>)
output :  tensor([[182525.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(14326816., grad_fn=<MseLossBackward>)
output :  tensor([[153188.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1412940.8750, grad_fn=<MseLossBackward>)
output :  tensor([[335055.]], grad_fn=<AddmmBackward>)
loss:  tensor(3783025., grad_fn=<MseLossBackward>)
output :  tensor([[215628.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(13166693., grad_fn=<MseLossBackward>)
output :  tensor([[159693.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(93655.1250, grad_fn=<MseLossBackward>)
output :  tensor([[187195.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9490e+09, grad_fn=<MseLossBackward>)
output :  tensor([[104376.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(389239.5000, grad_fn=<MseLossBackward>)
output :  tensor([[273742.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9106e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171777.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4505736., grad_fn=<MseLossBackward>)
output :  tensor([[214646.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1314605.6250, grad_fn=<MseLossBackward>)
output :  tensor([[209812.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2516e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178537.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(439216.8438, grad_fn=<MseLossBackward>)
output :  tensor([[199543.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5092145., grad_fn=<MseLossBackward>)
output :  tensor([[153861.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1297071.8750, grad_fn=<MseLossBackward>)
output :  tensor([[146929.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2024e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117053.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(2093063., grad_fn=<MseLossBackward>)
output :  tensor([[140771.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(595405.1250, grad_fn=<MseLossBackward>)
output :  tensor([[148541.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(210609.2812, grad_fn=<MseLossBackward>)
output :  tensor([[202503.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5749e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160388.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(789126.8750, grad_fn=<MseLossBackward>)
output :  tensor([[100280.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(609241.2500, grad_fn=<MseLossBackward>)
output :  tensor([[224165.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5074e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184938.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7785e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175776.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(501463.1562, grad_fn=<MseLossBackward>)
output :  tensor([[78842.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(9971829., grad_fn=<MseLossBackward>)
output :  tensor([[128997.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(247280.8750, grad_fn=<MseLossBackward>)
output :  tensor([[218403.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(19391226., grad_fn=<MseLossBackward>)
output :  tensor([[143617.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(146449.7188, grad_fn=<MseLossBackward>)
output :  tensor([[132380.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5665292.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144972.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5628237.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177207.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5766e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143937.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3910.1572, grad_fn=<MseLossBackward>)
output :  tensor([[158534.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2148331.5000, grad_fn=<MseLossBackward>)
output :  tensor([[213386.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2602222.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138152.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0991e+09, grad_fn=<MseLossBackward>)
output :  tensor([[254644.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(126669.2578, grad_fn=<MseLossBackward>)
output :  tensor([[159725.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(50688.3008, grad_fn=<MseLossBackward>)
output :  tensor([[129726.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(1504283.1250, grad_fn=<MseLossBackward>)
output :  tensor([[93153.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(3410976., grad_fn=<MseLossBackward>)
output :  tensor([[153262.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7283e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178598.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1693007.6250, grad_fn=<MseLossBackward>)
output :  tensor([[123461.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(8770714., grad_fn=<MseLossBackward>)
output :  tensor([[187579.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7115e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145325.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3330e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150423.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(273578.0312, grad_fn=<MseLossBackward>)
output :  tensor([[187850.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(10156.8604, grad_fn=<MseLossBackward>)
output :  tensor([[255265.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4297e+09, grad_fn=<MseLossBackward>)
output :  tensor([[90256.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1545554., grad_fn=<MseLossBackward>)
output :  tensor([[242294.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5264085., grad_fn=<MseLossBackward>)
output :  tensor([[131412.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8480927., grad_fn=<MseLossBackward>)
output :  tensor([[164485.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0285e+10, grad_fn=<MseLossBackward>)
output :  tensor([[114696.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1598e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178781.]], grad_fn=<AddmmBackward>)
loss:  tensor(7733961., grad_fn=<MseLossBackward>)
output :  tensor([[163442.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7805e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156417.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7171e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239133.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(17851.4648, grad_fn=<MseLossBackward>)
output :  tensor([[227187.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4940e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129279.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5195693., grad_fn=<MseLossBackward>)
output :  tensor([[123790.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4883478.5000, grad_fn=<MseLossBackward>)
output :  tensor([[223773.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(10413428., grad_fn=<MseLossBackward>)
output :  tensor([[229843.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(17274804., grad_fn=<MseLossBackward>)
output :  tensor([[227905.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1454360.6250, grad_fn=<MseLossBackward>)
output :  tensor([[145251.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7555369., grad_fn=<MseLossBackward>)
output :  tensor([[208097.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3620754.7500, grad_fn=<MseLossBackward>)
output :  tensor([[127596.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(57704556., grad_fn=<MseLossBackward>)
output :  tensor([[135430.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8586823., grad_fn=<MseLossBackward>)
output :  tensor([[312377.]], grad_fn=<AddmmBackward>)
loss:  tensor(6880129., grad_fn=<MseLossBackward>)
output :  tensor([[143020.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4083872.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120511.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8635e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109618.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(14099.7070, grad_fn=<MseLossBackward>)
output :  tensor([[155165.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0048e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181604.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6714e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172149.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(722978.1875, grad_fn=<MseLossBackward>)
output :  tensor([[193764.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(52350200., grad_fn=<MseLossBackward>)
output :  tensor([[98510.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2220053.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177782.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1483257.6250, grad_fn=<MseLossBackward>)
output :  tensor([[167124.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(601982., grad_fn=<MseLossBackward>)
output :  tensor([[135865.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(9823131., grad_fn=<MseLossBackward>)
output :  tensor([[258653.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0089e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142307.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2842e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173437.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(191570.3438, grad_fn=<MseLossBackward>)
output :  tensor([[141489.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2217958.7500, grad_fn=<MseLossBackward>)
output :  tensor([[201589.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1186737.8750, grad_fn=<MseLossBackward>)
output :  tensor([[166142.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(14883923., grad_fn=<MseLossBackward>)
output :  tensor([[244336.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(112980.0156, grad_fn=<MseLossBackward>)
output :  tensor([[133434.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1135290.2500, grad_fn=<MseLossBackward>)
output :  tensor([[148342.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1014647., grad_fn=<MseLossBackward>)
output :  tensor([[215256.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(65696.0938, grad_fn=<MseLossBackward>)
output :  tensor([[163340.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2754147.7500, grad_fn=<MseLossBackward>)
output :  tensor([[190831.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3354506.7500, grad_fn=<MseLossBackward>)
output :  tensor([[132545.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9984e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129364.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(132826.0781, grad_fn=<MseLossBackward>)
output :  tensor([[140874.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(765515.6250, grad_fn=<MseLossBackward>)
output :  tensor([[201685.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5987e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165075.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5076e+09, grad_fn=<MseLossBackward>)
output :  tensor([[75139.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2921e+08, grad_fn=<MseLossBackward>)
output :  tensor([[95146.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1336e+08, grad_fn=<MseLossBackward>)
output :  tensor([[251318.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3900563.2500, grad_fn=<MseLossBackward>)
output :  tensor([[203881.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2096e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119350.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(18927870., grad_fn=<MseLossBackward>)
output :  tensor([[159482.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8500e+08, grad_fn=<MseLossBackward>)
output :  tensor([[205701.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0445e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181186.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8879e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157965.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8792615., grad_fn=<MseLossBackward>)
output :  tensor([[170429.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(184470.2500, grad_fn=<MseLossBackward>)
output :  tensor([[115702.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(493890.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161927.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(47989392., grad_fn=<MseLossBackward>)
output :  tensor([[191233.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4543e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221752.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5075727.5000, grad_fn=<MseLossBackward>)
output :  tensor([[246379.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4862e+11, grad_fn=<MseLossBackward>)
output :  tensor([[148745.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3047588.5000, grad_fn=<MseLossBackward>)
output :  tensor([[108920.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(194370.7656, grad_fn=<MseLossBackward>)
output :  tensor([[169480.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5425e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147326.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(10071301., grad_fn=<MseLossBackward>)
output :  tensor([[232579.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(19536676., grad_fn=<MseLossBackward>)
output :  tensor([[115363.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(132143.6094, grad_fn=<MseLossBackward>)
output :  tensor([[186658.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(14128202., grad_fn=<MseLossBackward>)
output :  tensor([[189920.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(10368803., grad_fn=<MseLossBackward>)
output :  tensor([[163690.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4433e+10, grad_fn=<MseLossBackward>)
output :  tensor([[94816.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9090e+08, grad_fn=<MseLossBackward>)
output :  tensor([[233758.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(27477090., grad_fn=<MseLossBackward>)
output :  tensor([[177474.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2173966., grad_fn=<MseLossBackward>)
output :  tensor([[138375.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2640168., grad_fn=<MseLossBackward>)
output :  tensor([[235888.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(789682.1875, grad_fn=<MseLossBackward>)
output :  tensor([[161377.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2631188.2500, grad_fn=<MseLossBackward>)
output :  tensor([[204295.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4570e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133588.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1992773.3750, grad_fn=<MseLossBackward>)
output :  tensor([[185845.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6860e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133528.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6108312., grad_fn=<MseLossBackward>)
output :  tensor([[227731.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(68366024., grad_fn=<MseLossBackward>)
output :  tensor([[226096.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7138e+08, grad_fn=<MseLossBackward>)
output :  tensor([[90420.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(176636.3281, grad_fn=<MseLossBackward>)
output :  tensor([[162736.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(10907125., grad_fn=<MseLossBackward>)
output :  tensor([[244562.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5955e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145630.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(397471.1562, grad_fn=<MseLossBackward>)
output :  tensor([[107795.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6643e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164238.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(68194.4297, grad_fn=<MseLossBackward>)
output :  tensor([[141580.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5854812., grad_fn=<MseLossBackward>)
output :  tensor([[130977.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(7714202.5000, grad_fn=<MseLossBackward>)
output :  tensor([[190707.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6639e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123397.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(805997.1250, grad_fn=<MseLossBackward>)
output :  tensor([[152333.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(110972.2656, grad_fn=<MseLossBackward>)
output :  tensor([[165856.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(34735184., grad_fn=<MseLossBackward>)
output :  tensor([[149528.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2164668.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161216.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2833330.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135214.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8720e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131531.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(219389.7812, grad_fn=<MseLossBackward>)
output :  tensor([[156544.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0780e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145777.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2640777.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156462.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(27962614., grad_fn=<MseLossBackward>)
output :  tensor([[136317.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9788e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149252.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(204883.5312, grad_fn=<MseLossBackward>)
output :  tensor([[184673.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(11065290., grad_fn=<MseLossBackward>)
output :  tensor([[168201.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(637876.7500, grad_fn=<MseLossBackward>)
output :  tensor([[178565.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2058148.8750, grad_fn=<MseLossBackward>)
output :  tensor([[215430.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(20883758., grad_fn=<MseLossBackward>)
output :  tensor([[108452.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(305532.5625, grad_fn=<MseLossBackward>)
output :  tensor([[136560.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3596e+08, grad_fn=<MseLossBackward>)
output :  tensor([[279893.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(37290488., grad_fn=<MseLossBackward>)
output :  tensor([[118384.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(5685132.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178130.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7530e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181360.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(13243003., grad_fn=<MseLossBackward>)
output :  tensor([[173778.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3740e+08, grad_fn=<MseLossBackward>)
output :  tensor([[249101.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7073e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219349.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(7022997., grad_fn=<MseLossBackward>)
output :  tensor([[125001.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6488e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174898.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7955e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123998.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0889, grad_fn=<MseLossBackward>)
output :  tensor([[181716.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6081e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152480.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(270205.0312, grad_fn=<MseLossBackward>)
output :  tensor([[154427.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(62852440., grad_fn=<MseLossBackward>)
output :  tensor([[210366.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(16533500., grad_fn=<MseLossBackward>)
output :  tensor([[145842.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7802e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177328.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1765078.3750, grad_fn=<MseLossBackward>)
output :  tensor([[251929.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6016e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148216.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(46987.3359, grad_fn=<MseLossBackward>)
output :  tensor([[200475.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4792268.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159101.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(719766.6250, grad_fn=<MseLossBackward>)
output :  tensor([[124511.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3331e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134117.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2664393., grad_fn=<MseLossBackward>)
output :  tensor([[186948.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8696048., grad_fn=<MseLossBackward>)
output :  tensor([[196417.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(41183904., grad_fn=<MseLossBackward>)
output :  tensor([[227459.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7873e+09, grad_fn=<MseLossBackward>)
output :  tensor([[253718.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(10766499., grad_fn=<MseLossBackward>)
output :  tensor([[183988.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8228e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144080.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7647e+09, grad_fn=<MseLossBackward>)
output :  tensor([[140564.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(15484717., grad_fn=<MseLossBackward>)
output :  tensor([[73527.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1241e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135527.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(278338.6875, grad_fn=<MseLossBackward>)
output :  tensor([[127315.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(2509229.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155208.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1460472.2500, grad_fn=<MseLossBackward>)
output :  tensor([[125170.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3348557., grad_fn=<MseLossBackward>)
output :  tensor([[79503.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(9021388., grad_fn=<MseLossBackward>)
output :  tensor([[83319.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(1740894.7500, grad_fn=<MseLossBackward>)
output :  tensor([[229269.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7458275.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140287.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7217e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133042.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6463670.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169100.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4411378., grad_fn=<MseLossBackward>)
output :  tensor([[234522.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(228036.0938, grad_fn=<MseLossBackward>)
output :  tensor([[189417.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7414473.5000, grad_fn=<MseLossBackward>)
output :  tensor([[156707.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(500711.0312, grad_fn=<MseLossBackward>)
output :  tensor([[196097.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3248950., grad_fn=<MseLossBackward>)
output :  tensor([[204231.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0738e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137589.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(347031.4375, grad_fn=<MseLossBackward>)
output :  tensor([[155159.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(25425.2988, grad_fn=<MseLossBackward>)
output :  tensor([[135327.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(452025.0938, grad_fn=<MseLossBackward>)
output :  tensor([[198845.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7061e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152023.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3907664., grad_fn=<MseLossBackward>)
output :  tensor([[137356.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9234e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148350.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(11909185., grad_fn=<MseLossBackward>)
output :  tensor([[209871.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4530445.5000, grad_fn=<MseLossBackward>)
output :  tensor([[101282.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7182e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164270.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(10428358., grad_fn=<MseLossBackward>)
output :  tensor([[127970.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(883.2041, grad_fn=<MseLossBackward>)
output :  tensor([[148850.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3424813., grad_fn=<MseLossBackward>)
output :  tensor([[106119.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9129e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139848.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5514351.5000, grad_fn=<MseLossBackward>)
output :  tensor([[233282.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(7384212., grad_fn=<MseLossBackward>)
output :  tensor([[144053.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(895803.1250, grad_fn=<MseLossBackward>)
output :  tensor([[137798.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(89214.2188, grad_fn=<MseLossBackward>)
output :  tensor([[162581.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1959e+09, grad_fn=<MseLossBackward>)
output :  tensor([[271447.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(42929524., grad_fn=<MseLossBackward>)
output :  tensor([[172129.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(8238425., grad_fn=<MseLossBackward>)
output :  tensor([[103875.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1209072., grad_fn=<MseLossBackward>)
output :  tensor([[201124.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8332e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161479.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(6150167.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161165.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6768e+10, grad_fn=<MseLossBackward>)
output :  tensor([[100158.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3453673.7500, grad_fn=<MseLossBackward>)
output :  tensor([[122977.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(387185.3438, grad_fn=<MseLossBackward>)
output :  tensor([[156430.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(185693.6562, grad_fn=<MseLossBackward>)
output :  tensor([[139383.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(380361.2812, grad_fn=<MseLossBackward>)
output :  tensor([[197961.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4156756.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141323.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(457292.9375, grad_fn=<MseLossBackward>)
output :  tensor([[259810.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6099665., grad_fn=<MseLossBackward>)
output :  tensor([[129589.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3388e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161736.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(14160287., grad_fn=<MseLossBackward>)
output :  tensor([[186595.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3628191.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122837.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6479e+08, grad_fn=<MseLossBackward>)
output :  tensor([[253996.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(15970514., grad_fn=<MseLossBackward>)
output :  tensor([[159772.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4133e+08, grad_fn=<MseLossBackward>)
output :  tensor([[241438.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(15299466., grad_fn=<MseLossBackward>)
output :  tensor([[141561.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5944987., grad_fn=<MseLossBackward>)
output :  tensor([[211085.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1178988.7500, grad_fn=<MseLossBackward>)
output :  tensor([[177614.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(27190358., grad_fn=<MseLossBackward>)
output :  tensor([[154208.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(43316.0156, grad_fn=<MseLossBackward>)
output :  tensor([[119301.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(1693393.8750, grad_fn=<MseLossBackward>)
output :  tensor([[236868.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5222e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236039.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(15684075., grad_fn=<MseLossBackward>)
output :  tensor([[152074.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1593709., grad_fn=<MseLossBackward>)
output :  tensor([[255221.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(103352.2031, grad_fn=<MseLossBackward>)
output :  tensor([[126067.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3372e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175341.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(434239.8125, grad_fn=<MseLossBackward>)
output :  tensor([[162178.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4747292., grad_fn=<MseLossBackward>)
output :  tensor([[132562.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2440625., grad_fn=<MseLossBackward>)
output :  tensor([[193559.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1036e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165453.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2111663., grad_fn=<MseLossBackward>)
output :  tensor([[168983.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(35802460., grad_fn=<MseLossBackward>)
output :  tensor([[158123.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(15252.2500, grad_fn=<MseLossBackward>)
output :  tensor([[148745.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1331788.1250, grad_fn=<MseLossBackward>)
output :  tensor([[172228.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9349e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157766.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4989429.5000, grad_fn=<MseLossBackward>)
output :  tensor([[376381.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(57589128., grad_fn=<MseLossBackward>)
output :  tensor([[136535.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(90929336., grad_fn=<MseLossBackward>)
output :  tensor([[129538.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9394e+09, grad_fn=<MseLossBackward>)
output :  tensor([[279710.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2257412.2500, grad_fn=<MseLossBackward>)
output :  tensor([[160811.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1412829.3750, grad_fn=<MseLossBackward>)
output :  tensor([[130661.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0326e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223878.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(65963584., grad_fn=<MseLossBackward>)
output :  tensor([[182104.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2574019.2500, grad_fn=<MseLossBackward>)
output :  tensor([[151006.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(986918.0625, grad_fn=<MseLossBackward>)
output :  tensor([[144726.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(74998.9609, grad_fn=<MseLossBackward>)
output :  tensor([[154427.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0721e+08, grad_fn=<MseLossBackward>)
output :  tensor([[101648.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(2717320.5000, grad_fn=<MseLossBackward>)
output :  tensor([[74650.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1463e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165415.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(172744.1406, grad_fn=<MseLossBackward>)
output :  tensor([[188855.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5323e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163758.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(33156364., grad_fn=<MseLossBackward>)
output :  tensor([[161272.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(14231756., grad_fn=<MseLossBackward>)
output :  tensor([[138636.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1406966.6250, grad_fn=<MseLossBackward>)
output :  tensor([[204893.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1115895.1250, grad_fn=<MseLossBackward>)
output :  tensor([[140774.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(7698457., grad_fn=<MseLossBackward>)
output :  tensor([[181546.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6500e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146088.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7804.6182, grad_fn=<MseLossBackward>)
output :  tensor([[110310.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4584e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93875.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(15490.5254, grad_fn=<MseLossBackward>)
output :  tensor([[174724.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(75753.9609, grad_fn=<MseLossBackward>)
output :  tensor([[268983.]], grad_fn=<AddmmBackward>)
loss:  tensor(73667888., grad_fn=<MseLossBackward>)
output :  tensor([[140969.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(281894.6250, grad_fn=<MseLossBackward>)
output :  tensor([[159116.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(606451.5625, grad_fn=<MseLossBackward>)
output :  tensor([[131358.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1303379., grad_fn=<MseLossBackward>)
output :  tensor([[149964.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(215919.9531, grad_fn=<MseLossBackward>)
output :  tensor([[168195.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(87320.2500, grad_fn=<MseLossBackward>)
output :  tensor([[126546.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(205633.9062, grad_fn=<MseLossBackward>)
output :  tensor([[172887.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7773e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157365.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(133898.8125, grad_fn=<MseLossBackward>)
output :  tensor([[113752.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7546352.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161242.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1491e+09, grad_fn=<MseLossBackward>)
output :  tensor([[51407.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(351343.3125, grad_fn=<MseLossBackward>)
output :  tensor([[230582.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7105e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200517.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(232414.3906, grad_fn=<MseLossBackward>)
output :  tensor([[183945.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1112003.2500, grad_fn=<MseLossBackward>)
output :  tensor([[107178.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1388715., grad_fn=<MseLossBackward>)
output :  tensor([[87895.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(801640.4375, grad_fn=<MseLossBackward>)
output :  tensor([[146118.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(37437956., grad_fn=<MseLossBackward>)
output :  tensor([[222981.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0436e+09, grad_fn=<MseLossBackward>)
output :  tensor([[203510.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(15912744., grad_fn=<MseLossBackward>)
output :  tensor([[168305.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(10929326., grad_fn=<MseLossBackward>)
output :  tensor([[174754.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1443e+09, grad_fn=<MseLossBackward>)
output :  tensor([[188278.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2963938.7500, grad_fn=<MseLossBackward>)
output :  tensor([[86808.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(36822.0117, grad_fn=<MseLossBackward>)
output :  tensor([[138224.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3152566.7500, grad_fn=<MseLossBackward>)
output :  tensor([[110928.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(183324.4688, grad_fn=<MseLossBackward>)
output :  tensor([[148398.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5473e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172498.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7221e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196468.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(72792360., grad_fn=<MseLossBackward>)
output :  tensor([[179852.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(21765.4688, grad_fn=<MseLossBackward>)
output :  tensor([[96327.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(29785.9062, grad_fn=<MseLossBackward>)
output :  tensor([[119039.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(2370661.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161414.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1010e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202445.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5980317.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147996.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(15969265., grad_fn=<MseLossBackward>)
train_loss: [2.5973458e+09]
epoch_result tensor([0.])
output :  tensor([[161890.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(11496656., grad_fn=<MseLossBackward>)
output :  tensor([[123631.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(2660339.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198128.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(15426115., grad_fn=<MseLossBackward>)
output :  tensor([[177628.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(395110.4688, grad_fn=<MseLossBackward>)
output :  tensor([[153030.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2348e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128989.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(979295.8125, grad_fn=<MseLossBackward>)
output :  tensor([[139480.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2307408.5000, grad_fn=<MseLossBackward>)
output :  tensor([[119113.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(12862.7500, grad_fn=<MseLossBackward>)
output :  tensor([[66533.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(64543272., grad_fn=<MseLossBackward>)
output :  tensor([[165393.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(368411.0625, grad_fn=<MseLossBackward>)
output :  tensor([[136660.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(11150069., grad_fn=<MseLossBackward>)
output :  tensor([[226486.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2210193.2500, grad_fn=<MseLossBackward>)
output :  tensor([[166183.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(7935313., grad_fn=<MseLossBackward>)
output :  tensor([[250484.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(615293.1875, grad_fn=<MseLossBackward>)
output :  tensor([[57592.4023]], grad_fn=<AddmmBackward>)
loss:  tensor(6720550., grad_fn=<MseLossBackward>)
output :  tensor([[161588.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9203e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168863.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(37656824., grad_fn=<MseLossBackward>)
output :  tensor([[156830.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(109178.6172, grad_fn=<MseLossBackward>)
output :  tensor([[274134.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(749252.5625, grad_fn=<MseLossBackward>)
output :  tensor([[200522.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(12406355., grad_fn=<MseLossBackward>)
output :  tensor([[138383.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5140e+10, grad_fn=<MseLossBackward>)
output :  tensor([[192040.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3378761., grad_fn=<MseLossBackward>)
output :  tensor([[179947.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0207e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152346.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1813693.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171502.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2257647., grad_fn=<MseLossBackward>)
output :  tensor([[87055.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2739800.7500, grad_fn=<MseLossBackward>)
output :  tensor([[170285.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2816e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186690.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2859269.7500, grad_fn=<MseLossBackward>)
output :  tensor([[206361.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4146e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110930.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(866426.4375, grad_fn=<MseLossBackward>)
output :  tensor([[170602.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(157819.9844, grad_fn=<MseLossBackward>)
output :  tensor([[136769.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(72706.0703, grad_fn=<MseLossBackward>)
output :  tensor([[131020.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4081725.7500, grad_fn=<MseLossBackward>)
output :  tensor([[119617.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(13894.5156, grad_fn=<MseLossBackward>)
output :  tensor([[148349.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8281e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168249.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1536e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149625.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(5622.6562, grad_fn=<MseLossBackward>)
output :  tensor([[183047.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(9288209., grad_fn=<MseLossBackward>)
output :  tensor([[143969.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(8819415., grad_fn=<MseLossBackward>)
output :  tensor([[106219.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6308e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136830.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1105e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136925.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3707490., grad_fn=<MseLossBackward>)
output :  tensor([[128273.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1621205.3750, grad_fn=<MseLossBackward>)
output :  tensor([[224155.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(712362.3750, grad_fn=<MseLossBackward>)
output :  tensor([[131847.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(161880.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152213.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(10328189., grad_fn=<MseLossBackward>)
output :  tensor([[113316.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(1732740.2500, grad_fn=<MseLossBackward>)
output :  tensor([[162560.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6556480.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147214.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2834e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192691.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(478107.4375, grad_fn=<MseLossBackward>)
output :  tensor([[135666.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1478770., grad_fn=<MseLossBackward>)
output :  tensor([[119753.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(95128632., grad_fn=<MseLossBackward>)
output :  tensor([[231348.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(7029458., grad_fn=<MseLossBackward>)
output :  tensor([[167389.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1253e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160396.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1949906.7500, grad_fn=<MseLossBackward>)
output :  tensor([[203138.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8683e+10, grad_fn=<MseLossBackward>)
output :  tensor([[245150.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1848e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141842.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2746736.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136858.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(8168700., grad_fn=<MseLossBackward>)
output :  tensor([[150526.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(20012902., grad_fn=<MseLossBackward>)
output :  tensor([[135103.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(26040928., grad_fn=<MseLossBackward>)
output :  tensor([[180766.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2779e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182803.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1681155.3750, grad_fn=<MseLossBackward>)
output :  tensor([[164606.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(9652187., grad_fn=<MseLossBackward>)
output :  tensor([[136430.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(43157716., grad_fn=<MseLossBackward>)
output :  tensor([[143184.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(468133.9062, grad_fn=<MseLossBackward>)
output :  tensor([[150152.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(26550350., grad_fn=<MseLossBackward>)
output :  tensor([[173666.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3585e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194135.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2277e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136061.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(191953.5156, grad_fn=<MseLossBackward>)
output :  tensor([[172640.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(547923.8125, grad_fn=<MseLossBackward>)
output :  tensor([[182216.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1480062.3750, grad_fn=<MseLossBackward>)
output :  tensor([[115116.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(13623.2666, grad_fn=<MseLossBackward>)
output :  tensor([[219135.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3477584., grad_fn=<MseLossBackward>)
output :  tensor([[186234.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7476465., grad_fn=<MseLossBackward>)
output :  tensor([[128983.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(12132758., grad_fn=<MseLossBackward>)
output :  tensor([[195254.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1552243.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177910.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(9063487., grad_fn=<MseLossBackward>)
output :  tensor([[206895.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2168e+10, grad_fn=<MseLossBackward>)
output :  tensor([[208769.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4974642.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166653.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2712e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195606.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1223858.2500, grad_fn=<MseLossBackward>)
output :  tensor([[114420.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2016533.1250, grad_fn=<MseLossBackward>)
output :  tensor([[115649.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(9920876., grad_fn=<MseLossBackward>)
output :  tensor([[112335.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(112738.5547, grad_fn=<MseLossBackward>)
output :  tensor([[146494.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(93177.5625, grad_fn=<MseLossBackward>)
output :  tensor([[160683.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3109e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180862.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(743528.9375, grad_fn=<MseLossBackward>)
output :  tensor([[127851.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(123816.0156, grad_fn=<MseLossBackward>)
output :  tensor([[145544.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(296174.0625, grad_fn=<MseLossBackward>)
output :  tensor([[181882.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2073e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116478.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(177510.8125, grad_fn=<MseLossBackward>)
output :  tensor([[194464.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6429394., grad_fn=<MseLossBackward>)
output :  tensor([[145545.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(297519.1250, grad_fn=<MseLossBackward>)
output :  tensor([[211826.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1153375.3750, grad_fn=<MseLossBackward>)
output :  tensor([[126412.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(169847.0156, grad_fn=<MseLossBackward>)
output :  tensor([[251582.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(10594516., grad_fn=<MseLossBackward>)
output :  tensor([[240843.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9498e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148862.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0495e+08, grad_fn=<MseLossBackward>)
output :  tensor([[88105.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3473e+08, grad_fn=<MseLossBackward>)
output :  tensor([[193467.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6312e+09, grad_fn=<MseLossBackward>)
output :  tensor([[79973.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(1054231.6250, grad_fn=<MseLossBackward>)
output :  tensor([[141816.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5364290.5000, grad_fn=<MseLossBackward>)
output :  tensor([[76543.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1089218.3750, grad_fn=<MseLossBackward>)
output :  tensor([[144067.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1242423.7500, grad_fn=<MseLossBackward>)
output :  tensor([[175007.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(984529.0625, grad_fn=<MseLossBackward>)
output :  tensor([[154292.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(628229.6250, grad_fn=<MseLossBackward>)
output :  tensor([[108093.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(481419.1562, grad_fn=<MseLossBackward>)
output :  tensor([[204458.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2386e+10, grad_fn=<MseLossBackward>)
output :  tensor([[129435.]], grad_fn=<AddmmBackward>)
loss:  tensor(874225., grad_fn=<MseLossBackward>)
output :  tensor([[268750.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2654e+08, grad_fn=<MseLossBackward>)
output :  tensor([[301900.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(65605952., grad_fn=<MseLossBackward>)
output :  tensor([[106176.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(1751714.2500, grad_fn=<MseLossBackward>)
output :  tensor([[173503.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1007639.5625, grad_fn=<MseLossBackward>)
output :  tensor([[134961.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2690e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144971.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(35658252., grad_fn=<MseLossBackward>)
output :  tensor([[128108.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(4587929.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121308.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(13628614., grad_fn=<MseLossBackward>)
output :  tensor([[135714.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8719e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226118.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8762e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187079.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3691e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145475.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2483332.7500, grad_fn=<MseLossBackward>)
output :  tensor([[130345.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(8099049., grad_fn=<MseLossBackward>)
output :  tensor([[111816.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(320506.3750, grad_fn=<MseLossBackward>)
output :  tensor([[255557.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9067e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134408.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(349465.7188, grad_fn=<MseLossBackward>)
output :  tensor([[206025.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9152138., grad_fn=<MseLossBackward>)
output :  tensor([[105660.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(578217.6875, grad_fn=<MseLossBackward>)
output :  tensor([[137585.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(5590343., grad_fn=<MseLossBackward>)
output :  tensor([[208743.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4827e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175423.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(20034856., grad_fn=<MseLossBackward>)
output :  tensor([[186725.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2977188.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162962.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1327e+10, grad_fn=<MseLossBackward>)
output :  tensor([[299313.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2735e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194478.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(11704096., grad_fn=<MseLossBackward>)
output :  tensor([[257799.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1043e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221226.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0047e+09, grad_fn=<MseLossBackward>)
output :  tensor([[280120.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3601e+09, grad_fn=<MseLossBackward>)
output :  tensor([[221111.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(8345418., grad_fn=<MseLossBackward>)
output :  tensor([[222550.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8713e+10, grad_fn=<MseLossBackward>)
output :  tensor([[202953.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(35447140., grad_fn=<MseLossBackward>)
output :  tensor([[158315.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5942e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130487.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(4048427., grad_fn=<MseLossBackward>)
output :  tensor([[133636.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3472166.5000, grad_fn=<MseLossBackward>)
output :  tensor([[90562.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(191009.9688, grad_fn=<MseLossBackward>)
output :  tensor([[107766.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(54555.0898, grad_fn=<MseLossBackward>)
output :  tensor([[274156.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9968e+09, grad_fn=<MseLossBackward>)
output :  tensor([[235561.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(314913.8750, grad_fn=<MseLossBackward>)
output :  tensor([[147573.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6623626., grad_fn=<MseLossBackward>)
output :  tensor([[138210.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(504788.0625, grad_fn=<MseLossBackward>)
output :  tensor([[171728.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4018208.2500, grad_fn=<MseLossBackward>)
output :  tensor([[148851.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(12973391., grad_fn=<MseLossBackward>)
output :  tensor([[164213.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1730e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165676.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(457779.0938, grad_fn=<MseLossBackward>)
output :  tensor([[137162.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(26411.3281, grad_fn=<MseLossBackward>)
output :  tensor([[188249.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3230e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113056.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1116786.6250, grad_fn=<MseLossBackward>)
output :  tensor([[176614.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(21297792., grad_fn=<MseLossBackward>)
output :  tensor([[118542.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2124260.7500, grad_fn=<MseLossBackward>)
output :  tensor([[86991.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(73.5842, grad_fn=<MseLossBackward>)
output :  tensor([[177940.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4242184., grad_fn=<MseLossBackward>)
output :  tensor([[112404.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(6271933.5000, grad_fn=<MseLossBackward>)
output :  tensor([[236095.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8437663., grad_fn=<MseLossBackward>)
output :  tensor([[244807.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(36966.0703, grad_fn=<MseLossBackward>)
output :  tensor([[133650.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(17225354., grad_fn=<MseLossBackward>)
output :  tensor([[107622.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(1785626.7500, grad_fn=<MseLossBackward>)
output :  tensor([[286471.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2705e+10, grad_fn=<MseLossBackward>)
output :  tensor([[172830.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1771061.8750, grad_fn=<MseLossBackward>)
output :  tensor([[130086.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(25868986., grad_fn=<MseLossBackward>)
output :  tensor([[142003.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7619e+08, grad_fn=<MseLossBackward>)
output :  tensor([[201512.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5594e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144242.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(10513401., grad_fn=<MseLossBackward>)
output :  tensor([[155335.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5541e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157238.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(11143183., grad_fn=<MseLossBackward>)
output :  tensor([[132848.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(11210987., grad_fn=<MseLossBackward>)
output :  tensor([[245239.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7758e+10, grad_fn=<MseLossBackward>)
output :  tensor([[395433.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(43116460., grad_fn=<MseLossBackward>)
output :  tensor([[117816.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(77737288., grad_fn=<MseLossBackward>)
output :  tensor([[117169.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1769731.3750, grad_fn=<MseLossBackward>)
output :  tensor([[159828.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(108127.9375, grad_fn=<MseLossBackward>)
output :  tensor([[130461.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5405e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162415.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5503e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174083.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1067e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106391.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7791425.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140288.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(506121.0938, grad_fn=<MseLossBackward>)
output :  tensor([[361798.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(30201894., grad_fn=<MseLossBackward>)
output :  tensor([[204957.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4052e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175555.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3108.0625, grad_fn=<MseLossBackward>)
output :  tensor([[204840.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3764024.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141559.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6553040., grad_fn=<MseLossBackward>)
output :  tensor([[194579.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(6283.0391, grad_fn=<MseLossBackward>)
output :  tensor([[136296.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2926e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179599.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1960393.7500, grad_fn=<MseLossBackward>)
output :  tensor([[242057.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3351.3245, grad_fn=<MseLossBackward>)
output :  tensor([[173148.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(724440.3750, grad_fn=<MseLossBackward>)
output :  tensor([[109038.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(1079407.3750, grad_fn=<MseLossBackward>)
output :  tensor([[262589.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3886689., grad_fn=<MseLossBackward>)
output :  tensor([[249549.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(202781.3438, grad_fn=<MseLossBackward>)
output :  tensor([[120937.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4255260., grad_fn=<MseLossBackward>)
output :  tensor([[214279.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6870e+09, grad_fn=<MseLossBackward>)
output :  tensor([[304400.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3680e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206334.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(442640.7188, grad_fn=<MseLossBackward>)
output :  tensor([[214636.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5716e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160643.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7525677.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174027.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(16298504., grad_fn=<MseLossBackward>)
output :  tensor([[161779.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(23501740., grad_fn=<MseLossBackward>)
output :  tensor([[170404.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(163885.8125, grad_fn=<MseLossBackward>)
output :  tensor([[236623.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8451e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221368.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(65405128., grad_fn=<MseLossBackward>)
output :  tensor([[159802.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6391e+08, grad_fn=<MseLossBackward>)
output :  tensor([[119659.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(11160558., grad_fn=<MseLossBackward>)
output :  tensor([[175903.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1202449.3750, grad_fn=<MseLossBackward>)
output :  tensor([[180280.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3552e+09, grad_fn=<MseLossBackward>)
output :  tensor([[208852.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4508e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133656.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(600721.8750, grad_fn=<MseLossBackward>)
output :  tensor([[149604.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8425e+08, grad_fn=<MseLossBackward>)
output :  tensor([[271974.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(25258792., grad_fn=<MseLossBackward>)
output :  tensor([[89773.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(22786600., grad_fn=<MseLossBackward>)
output :  tensor([[232854.]], grad_fn=<AddmmBackward>)
loss:  tensor(13293316., grad_fn=<MseLossBackward>)
output :  tensor([[260290.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0410e+11, grad_fn=<MseLossBackward>)
output :  tensor([[169095.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(817781.1250, grad_fn=<MseLossBackward>)
output :  tensor([[193056.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7593e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155708.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(501330.3750, grad_fn=<MseLossBackward>)
output :  tensor([[207640.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8887e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127829.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1371058., grad_fn=<MseLossBackward>)
output :  tensor([[147061.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4251715., grad_fn=<MseLossBackward>)
output :  tensor([[169977.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5500e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186978.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1273300.6250, grad_fn=<MseLossBackward>)
output :  tensor([[126047.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(2251.0576, grad_fn=<MseLossBackward>)
output :  tensor([[139284.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7752309., grad_fn=<MseLossBackward>)
output :  tensor([[167294.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(32549700., grad_fn=<MseLossBackward>)
output :  tensor([[195574.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9621e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238750.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(18056392., grad_fn=<MseLossBackward>)
output :  tensor([[153155.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3403275.5000, grad_fn=<MseLossBackward>)
output :  tensor([[196410.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(168638.5625, grad_fn=<MseLossBackward>)
output :  tensor([[159640.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4463e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182858.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(11277213., grad_fn=<MseLossBackward>)
output :  tensor([[180471.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(326237.3125, grad_fn=<MseLossBackward>)
output :  tensor([[97694.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(482753.5625, grad_fn=<MseLossBackward>)
output :  tensor([[171990.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1666e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133481.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2306079.5000, grad_fn=<MseLossBackward>)
output :  tensor([[118697.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(13668502., grad_fn=<MseLossBackward>)
output :  tensor([[172464.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2358048.2500, grad_fn=<MseLossBackward>)
output :  tensor([[88652.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(13341213., grad_fn=<MseLossBackward>)
output :  tensor([[285050.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(24501572., grad_fn=<MseLossBackward>)
output :  tensor([[166092.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1192737., grad_fn=<MseLossBackward>)
output :  tensor([[194296.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9285e+10, grad_fn=<MseLossBackward>)
output :  tensor([[243740.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4306e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152138.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1296075.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124450.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(203091.0625, grad_fn=<MseLossBackward>)
output :  tensor([[115459.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(19716514., grad_fn=<MseLossBackward>)
output :  tensor([[149517.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1915e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174018.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(324.5627, grad_fn=<MseLossBackward>)
output :  tensor([[113548.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6403e+08, grad_fn=<MseLossBackward>)
output :  tensor([[214173.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0780e+10, grad_fn=<MseLossBackward>)
output :  tensor([[244323.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(7971887.5000, grad_fn=<MseLossBackward>)
output :  tensor([[250314.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0989e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221468.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0737e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198294.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3737e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190966.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(12017814., grad_fn=<MseLossBackward>)
output :  tensor([[208384.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6866e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191707.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0820e+10, grad_fn=<MseLossBackward>)
output :  tensor([[173510.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(27352574., grad_fn=<MseLossBackward>)
output :  tensor([[151410.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(347473.4062, grad_fn=<MseLossBackward>)
output :  tensor([[341136.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(17111408., grad_fn=<MseLossBackward>)
output :  tensor([[209674.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5407151., grad_fn=<MseLossBackward>)
output :  tensor([[163773.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(14238595., grad_fn=<MseLossBackward>)
output :  tensor([[185728.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1104e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107964.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(8787843., grad_fn=<MseLossBackward>)
output :  tensor([[273394.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9302e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171592.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5323763., grad_fn=<MseLossBackward>)
output :  tensor([[217767.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(18215158., grad_fn=<MseLossBackward>)
output :  tensor([[208000.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6899e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178477.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(522277.2188, grad_fn=<MseLossBackward>)
output :  tensor([[199738.]], grad_fn=<AddmmBackward>)
loss:  tensor(4251844., grad_fn=<MseLossBackward>)
output :  tensor([[157378.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5657113.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146389.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1520e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114503.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(15969327., grad_fn=<MseLossBackward>)
output :  tensor([[139222.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(604214.7500, grad_fn=<MseLossBackward>)
output :  tensor([[150473.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2170465.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202983.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5629e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161949.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5998749., grad_fn=<MseLossBackward>)
output :  tensor([[98507.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(984312., grad_fn=<MseLossBackward>)
output :  tensor([[225322.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1543e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186617.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4594e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175678.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(651072.5000, grad_fn=<MseLossBackward>)
output :  tensor([[86461.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(19903378., grad_fn=<MseLossBackward>)
output :  tensor([[129311.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(659280.5625, grad_fn=<MseLossBackward>)
output :  tensor([[217114.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(9701765., grad_fn=<MseLossBackward>)
output :  tensor([[145121.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1257937.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131590.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2531131.7500, grad_fn=<MseLossBackward>)
output :  tensor([[145221.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6874310.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179109.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7314e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144182.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(33340.4766, grad_fn=<MseLossBackward>)
output :  tensor([[162109.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4449463., grad_fn=<MseLossBackward>)
output :  tensor([[215591.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(350186.5625, grad_fn=<MseLossBackward>)
output :  tensor([[136653.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0020e+09, grad_fn=<MseLossBackward>)
output :  tensor([[254746.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(64428.7188, grad_fn=<MseLossBackward>)
output :  tensor([[157624.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3519024.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129462.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(926346.1250, grad_fn=<MseLossBackward>)
output :  tensor([[94430.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(324036.6562, grad_fn=<MseLossBackward>)
output :  tensor([[156014.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1143e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178785.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1242597.8750, grad_fn=<MseLossBackward>)
output :  tensor([[121068.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(322845.9062, grad_fn=<MseLossBackward>)
output :  tensor([[187520.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7164e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146491.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4878e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149464.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(189306.5781, grad_fn=<MseLossBackward>)
output :  tensor([[187703.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2156.4414, grad_fn=<MseLossBackward>)
output :  tensor([[252108.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6784e+09, grad_fn=<MseLossBackward>)
output :  tensor([[92693.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1423621.8750, grad_fn=<MseLossBackward>)
output :  tensor([[237660.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5471944.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129520.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(1040415.9375, grad_fn=<MseLossBackward>)
output :  tensor([[166577.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8650e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115109.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2829e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176325.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(106255.6250, grad_fn=<MseLossBackward>)
output :  tensor([[164303.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2019e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154295.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6623e+08, grad_fn=<MseLossBackward>)
output :  tensor([[234165.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(23368160., grad_fn=<MseLossBackward>)
output :  tensor([[226432.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9648e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126860.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(19362.2871, grad_fn=<MseLossBackward>)
output :  tensor([[128519.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6349376.5000, grad_fn=<MseLossBackward>)
output :  tensor([[226640.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(128925.8750, grad_fn=<MseLossBackward>)
output :  tensor([[229247.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(22588930., grad_fn=<MseLossBackward>)
output :  tensor([[225005.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2869953.7500, grad_fn=<MseLossBackward>)
output :  tensor([[150645.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(6997265., grad_fn=<MseLossBackward>)
output :  tensor([[208414.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2512423.2500, grad_fn=<MseLossBackward>)
output :  tensor([[130555.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1142e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132749.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(62234.6562, grad_fn=<MseLossBackward>)
output :  tensor([[309095.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(34863860., grad_fn=<MseLossBackward>)
output :  tensor([[135777.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(27277280., grad_fn=<MseLossBackward>)
output :  tensor([[122015.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0267e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109175.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(105356.0312, grad_fn=<MseLossBackward>)
output :  tensor([[159242.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7577e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181736.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6469e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178326.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(28368606., grad_fn=<MseLossBackward>)
output :  tensor([[192841.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(66560104., grad_fn=<MseLossBackward>)
output :  tensor([[106681.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(44636596., grad_fn=<MseLossBackward>)
output :  tensor([[177129.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3497835., grad_fn=<MseLossBackward>)
output :  tensor([[172194.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(18442060., grad_fn=<MseLossBackward>)
output :  tensor([[139274.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(75393.1484, grad_fn=<MseLossBackward>)
output :  tensor([[261700.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4867e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145107.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6129e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172024.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(951935.6250, grad_fn=<MseLossBackward>)
output :  tensor([[141067.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1138889.1250, grad_fn=<MseLossBackward>)
output :  tensor([[198023.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6134832.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166065.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(15478569., grad_fn=<MseLossBackward>)
output :  tensor([[242767.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1519171.7500, grad_fn=<MseLossBackward>)
output :  tensor([[134117.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(146665.0625, grad_fn=<MseLossBackward>)
output :  tensor([[152611.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(10639217., grad_fn=<MseLossBackward>)
output :  tensor([[210077.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(24234082., grad_fn=<MseLossBackward>)
output :  tensor([[164209.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(624569.1250, grad_fn=<MseLossBackward>)
output :  tensor([[184739.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(18149330., grad_fn=<MseLossBackward>)
output :  tensor([[130670.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0254e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127243.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(3085100.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139353.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(418083.4688, grad_fn=<MseLossBackward>)
output :  tensor([[202807.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4480e+09, grad_fn=<MseLossBackward>)
output :  tensor([[168910.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9063e+09, grad_fn=<MseLossBackward>)
output :  tensor([[74338.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0560e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93799.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(86482880., grad_fn=<MseLossBackward>)
output :  tensor([[255688.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5737671.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202676.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0547e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114690.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(95799.9219, grad_fn=<MseLossBackward>)
output :  tensor([[161699.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6566e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209478.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1071e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180886.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9412e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157993.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(8962446., grad_fn=<MseLossBackward>)
output :  tensor([[166563.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(11810391., grad_fn=<MseLossBackward>)
output :  tensor([[111370.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(13175142., grad_fn=<MseLossBackward>)
output :  tensor([[162184.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(51611876., grad_fn=<MseLossBackward>)
output :  tensor([[193431.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8141e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220313.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(661426.3750, grad_fn=<MseLossBackward>)
output :  tensor([[246674.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4833e+11, grad_fn=<MseLossBackward>)
output :  tensor([[144841.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4658380.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109324.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(712481.0625, grad_fn=<MseLossBackward>)
output :  tensor([[170019.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4115e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154399.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(15202567., grad_fn=<MseLossBackward>)
output :  tensor([[237982.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(966043.2500, grad_fn=<MseLossBackward>)
output :  tensor([[115579.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(336372.8125, grad_fn=<MseLossBackward>)
output :  tensor([[177735.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(26674642., grad_fn=<MseLossBackward>)
output :  tensor([[183347.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(11236533., grad_fn=<MseLossBackward>)
output :  tensor([[166923.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3432e+10, grad_fn=<MseLossBackward>)
output :  tensor([[95114.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9922e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238675.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(105127.9297, grad_fn=<MseLossBackward>)
output :  tensor([[179323.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(11043367., grad_fn=<MseLossBackward>)
output :  tensor([[139846.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(23648.6719, grad_fn=<MseLossBackward>)
output :  tensor([[233468.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2345923., grad_fn=<MseLossBackward>)
output :  tensor([[163871.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(760002.5625, grad_fn=<MseLossBackward>)
output :  tensor([[204762.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4457e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134383.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(380053., grad_fn=<MseLossBackward>)
output :  tensor([[187646.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5776e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135619.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(144875.3906, grad_fn=<MseLossBackward>)
output :  tensor([[227569.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(71074384., grad_fn=<MseLossBackward>)
output :  tensor([[227037.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2729e+08, grad_fn=<MseLossBackward>)
output :  tensor([[89727.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(74077.5312, grad_fn=<MseLossBackward>)
output :  tensor([[160276.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(709806.2500, grad_fn=<MseLossBackward>)
output :  tensor([[249794.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4661e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146176.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1384299.3750, grad_fn=<MseLossBackward>)
output :  tensor([[109129.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7749e+09, grad_fn=<MseLossBackward>)
output :  tensor([[169651.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(26536020., grad_fn=<MseLossBackward>)
output :  tensor([[143364.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(403939.6875, grad_fn=<MseLossBackward>)
output :  tensor([[130566.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5598399.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191399.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5698e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123104.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(365146.3750, grad_fn=<MseLossBackward>)
output :  tensor([[152298.]], grad_fn=<AddmmBackward>)
loss:  tensor(88804., grad_fn=<MseLossBackward>)
output :  tensor([[168663.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(9526386., grad_fn=<MseLossBackward>)
output :  tensor([[151390.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(152221.9062, grad_fn=<MseLossBackward>)
output :  tensor([[163952.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1107032.7500, grad_fn=<MseLossBackward>)
output :  tensor([[136173.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3840e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132439.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(193132.7812, grad_fn=<MseLossBackward>)
output :  tensor([[156405.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0297e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146710.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6548321., grad_fn=<MseLossBackward>)
output :  tensor([[158116.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(13201982., grad_fn=<MseLossBackward>)
output :  tensor([[138262.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0440e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147907.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(797337.3750, grad_fn=<MseLossBackward>)
output :  tensor([[185885.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4469590.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171724.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7424433., grad_fn=<MseLossBackward>)
output :  tensor([[181938.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3758630.5000, grad_fn=<MseLossBackward>)
output :  tensor([[221504.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2263332.2500, grad_fn=<MseLossBackward>)
output :  tensor([[107347.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(305636.2188, grad_fn=<MseLossBackward>)
output :  tensor([[135447.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1125e+08, grad_fn=<MseLossBackward>)
output :  tensor([[281745.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(18103164., grad_fn=<MseLossBackward>)
output :  tensor([[117809.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(3273131.2500, grad_fn=<MseLossBackward>)
output :  tensor([[178874.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6913e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181035.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(15714287., grad_fn=<MseLossBackward>)
output :  tensor([[192896.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(54705668., grad_fn=<MseLossBackward>)
output :  tensor([[252161.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2161e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222251.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(63032.3789, grad_fn=<MseLossBackward>)
output :  tensor([[125382.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7958e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176151.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3599e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125891.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3575999.2500, grad_fn=<MseLossBackward>)
output :  tensor([[184826.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4492e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153599.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(358988.2188, grad_fn=<MseLossBackward>)
output :  tensor([[153419.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(47878616., grad_fn=<MseLossBackward>)
output :  tensor([[204698.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2565302.7500, grad_fn=<MseLossBackward>)
output :  tensor([[145695.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7413e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175710.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(83719.8047, grad_fn=<MseLossBackward>)
output :  tensor([[252802.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1274e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148953.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(909281.4375, grad_fn=<MseLossBackward>)
output :  tensor([[201988.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(457398.5938, grad_fn=<MseLossBackward>)
output :  tensor([[165237.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(27955344., grad_fn=<MseLossBackward>)
output :  tensor([[123827.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2836e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139205.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(11941668., grad_fn=<MseLossBackward>)
output :  tensor([[178534.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(29876986., grad_fn=<MseLossBackward>)
output :  tensor([[199795.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(95950592., grad_fn=<MseLossBackward>)
output :  tensor([[232070.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2410e+09, grad_fn=<MseLossBackward>)
output :  tensor([[256812.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(35109.3906, grad_fn=<MseLossBackward>)
output :  tensor([[187306.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7343e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144143.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7713e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143226.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1621046.2500, grad_fn=<MseLossBackward>)
output :  tensor([[72593.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0624e+09, grad_fn=<MseLossBackward>)
output :  tensor([[126076.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(79633592., grad_fn=<MseLossBackward>)
output :  tensor([[128624.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(75698.0625, grad_fn=<MseLossBackward>)
output :  tensor([[153342.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(432491.1875, grad_fn=<MseLossBackward>)
output :  tensor([[133953.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(48350076., grad_fn=<MseLossBackward>)
output :  tensor([[77635.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1289395.7500, grad_fn=<MseLossBackward>)
output :  tensor([[82377.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(142482.6562, grad_fn=<MseLossBackward>)
output :  tensor([[242596.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1228e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140135.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6372e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131379.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(773712.6250, grad_fn=<MseLossBackward>)
output :  tensor([[167743.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(552908.4375, grad_fn=<MseLossBackward>)
output :  tensor([[236369.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1875016.7500, grad_fn=<MseLossBackward>)
output :  tensor([[190216.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3699611.7500, grad_fn=<MseLossBackward>)
output :  tensor([[155856.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(20453.4688, grad_fn=<MseLossBackward>)
output :  tensor([[196733.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1360284.8750, grad_fn=<MseLossBackward>)
output :  tensor([[202336.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2015e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137714.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(510956.9062, grad_fn=<MseLossBackward>)
output :  tensor([[155314.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(98979.0625, grad_fn=<MseLossBackward>)
output :  tensor([[136629.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(396585.0625, grad_fn=<MseLossBackward>)
output :  tensor([[198780.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7466e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158218.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(17791920., grad_fn=<MseLossBackward>)
output :  tensor([[138227.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0005e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144535.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(132894.4219, grad_fn=<MseLossBackward>)
output :  tensor([[209331.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7120225., grad_fn=<MseLossBackward>)
output :  tensor([[99863.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1910e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167277.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(49547.9766, grad_fn=<MseLossBackward>)
output :  tensor([[127625.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(140595.7031, grad_fn=<MseLossBackward>)
output :  tensor([[144976.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4094489., grad_fn=<MseLossBackward>)
output :  tensor([[104325.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7592e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136443.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1116621.5000, grad_fn=<MseLossBackward>)
output :  tensor([[237858.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3455358.2500, grad_fn=<MseLossBackward>)
output :  tensor([[146330.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1768983.1250, grad_fn=<MseLossBackward>)
output :  tensor([[141681.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(17487164., grad_fn=<MseLossBackward>)
output :  tensor([[164239.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3133e+09, grad_fn=<MseLossBackward>)
output :  tensor([[270400.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(57749552., grad_fn=<MseLossBackward>)
output :  tensor([[170157.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(23450866., grad_fn=<MseLossBackward>)
output :  tensor([[103050.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(75093.1250, grad_fn=<MseLossBackward>)
output :  tensor([[201162.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8274e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160240.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1538801.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163620.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5713e+10, grad_fn=<MseLossBackward>)
output :  tensor([[99671.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1880669.3750, grad_fn=<MseLossBackward>)
output :  tensor([[122723.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(768183.7500, grad_fn=<MseLossBackward>)
output :  tensor([[157585.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2512918.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142284.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5217726.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200030.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(946.5237, grad_fn=<MseLossBackward>)
output :  tensor([[143715.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2944602.5000, grad_fn=<MseLossBackward>)
output :  tensor([[262050.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(52663.0781, grad_fn=<MseLossBackward>)
output :  tensor([[126764.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1400e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162924.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6633763.5000, grad_fn=<MseLossBackward>)
output :  tensor([[188564.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4122.0410, grad_fn=<MseLossBackward>)
output :  tensor([[124455.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0897e+08, grad_fn=<MseLossBackward>)
output :  tensor([[245417.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(20995870., grad_fn=<MseLossBackward>)
output :  tensor([[158470.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1392e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243529.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3312457., grad_fn=<MseLossBackward>)
output :  tensor([[146557.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6541525.5000, grad_fn=<MseLossBackward>)
output :  tensor([[207316.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(7201088.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174899.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6246485., grad_fn=<MseLossBackward>)
output :  tensor([[154872.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(761010.8750, grad_fn=<MseLossBackward>)
output :  tensor([[116849.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1323075., grad_fn=<MseLossBackward>)
output :  tensor([[241822.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0491e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239942.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3340.4788, grad_fn=<MseLossBackward>)
output :  tensor([[150428.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8460736., grad_fn=<MseLossBackward>)
output :  tensor([[253317.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2503020.7500, grad_fn=<MseLossBackward>)
output :  tensor([[122689.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(67001388., grad_fn=<MseLossBackward>)
output :  tensor([[176250.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(62640.7031, grad_fn=<MseLossBackward>)
output :  tensor([[160498.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(248673.6406, grad_fn=<MseLossBackward>)
output :  tensor([[128935.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(4262579.5000, grad_fn=<MseLossBackward>)
output :  tensor([[196285.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4603e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164180.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(32580.2500, grad_fn=<MseLossBackward>)
output :  tensor([[168941.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(35298452., grad_fn=<MseLossBackward>)
output :  tensor([[156167.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3359201.7500, grad_fn=<MseLossBackward>)
output :  tensor([[150970.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1145803., grad_fn=<MseLossBackward>)
output :  tensor([[172525.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9722e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163418.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(11688386., grad_fn=<MseLossBackward>)
output :  tensor([[377131.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(46761664., grad_fn=<MseLossBackward>)
output :  tensor([[120897.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(37242316., grad_fn=<MseLossBackward>)
output :  tensor([[131789.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1428e+09, grad_fn=<MseLossBackward>)
output :  tensor([[281753.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(292545.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164387.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5699335.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133602.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7166e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239695.]], grad_fn=<AddmmBackward>)
loss:  tensor(59213024., grad_fn=<MseLossBackward>)
output :  tensor([[177261.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(10491020., grad_fn=<MseLossBackward>)
output :  tensor([[156440.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(19721232., grad_fn=<MseLossBackward>)
output :  tensor([[144326.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(454233.8750, grad_fn=<MseLossBackward>)
output :  tensor([[155814.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5775e+08, grad_fn=<MseLossBackward>)
output :  tensor([[102019.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(4080242.2500, grad_fn=<MseLossBackward>)
output :  tensor([[75483.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3973e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164186.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(661401., grad_fn=<MseLossBackward>)
output :  tensor([[192186.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2826e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163983.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(35803208., grad_fn=<MseLossBackward>)
output :  tensor([[155192.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5325421.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134939.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6301590.5000, grad_fn=<MseLossBackward>)
output :  tensor([[206362.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(169859.8906, grad_fn=<MseLossBackward>)
output :  tensor([[140070.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4288005.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183554.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5988e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143366.]], grad_fn=<AddmmBackward>)
loss:  tensor(6937956., grad_fn=<MseLossBackward>)
output :  tensor([[109214.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8721e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96785.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7757965.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175287.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(82917., grad_fn=<MseLossBackward>)
output :  tensor([[261947.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2394756.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143425.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3705685.2500, grad_fn=<MseLossBackward>)
output :  tensor([[157794.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4414135.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132819.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(102360., grad_fn=<MseLossBackward>)
output :  tensor([[147465.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4137982.2500, grad_fn=<MseLossBackward>)
output :  tensor([[165076.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(7973123., grad_fn=<MseLossBackward>)
output :  tensor([[126358.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(411582.4062, grad_fn=<MseLossBackward>)
output :  tensor([[171922.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2482e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156011.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(977441.1875, grad_fn=<MseLossBackward>)
output :  tensor([[116087.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(170414.1562, grad_fn=<MseLossBackward>)
output :  tensor([[161051.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1766e+09, grad_fn=<MseLossBackward>)
output :  tensor([[52586.6289]], grad_fn=<AddmmBackward>)
loss:  tensor(344133.4688, grad_fn=<MseLossBackward>)
output :  tensor([[235806.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8819e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201055.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3099.3577, grad_fn=<MseLossBackward>)
output :  tensor([[189183.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(17499320., grad_fn=<MseLossBackward>)
output :  tensor([[105297.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(493330.6250, grad_fn=<MseLossBackward>)
output :  tensor([[87542.]], grad_fn=<AddmmBackward>)
loss:  tensor(293764., grad_fn=<MseLossBackward>)
output :  tensor([[132228.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(60390868., grad_fn=<MseLossBackward>)
output :  tensor([[221038.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3234e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205418.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4333358., grad_fn=<MseLossBackward>)
output :  tensor([[170696.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(32453316., grad_fn=<MseLossBackward>)
output :  tensor([[173160.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4345e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190541.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(293645.4375, grad_fn=<MseLossBackward>)
output :  tensor([[89613.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6828259., grad_fn=<MseLossBackward>)
output :  tensor([[138279.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2961088., grad_fn=<MseLossBackward>)
output :  tensor([[105909.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(21075130., grad_fn=<MseLossBackward>)
output :  tensor([[149496.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8323e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172020.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6827e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194423.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1187e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182511.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6308024.5000, grad_fn=<MseLossBackward>)
output :  tensor([[98529.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(4119282.5000, grad_fn=<MseLossBackward>)
output :  tensor([[116484.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(1031224.3750, grad_fn=<MseLossBackward>)
output :  tensor([[161218.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1901e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196199.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(14447126., grad_fn=<MseLossBackward>)
output :  tensor([[143512.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(237473.4688, grad_fn=<MseLossBackward>)
train_loss: [2.5899612e+09]
epoch_result tensor([0.])
output :  tensor([[158548.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2335.6077, grad_fn=<MseLossBackward>)
output :  tensor([[119198.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(7849321.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194141.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3573.7979, grad_fn=<MseLossBackward>)
output :  tensor([[177173.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(30064.3086, grad_fn=<MseLossBackward>)
output :  tensor([[154439.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5511e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127293.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(498469.0938, grad_fn=<MseLossBackward>)
output :  tensor([[140884.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(13448.7510, grad_fn=<MseLossBackward>)
output :  tensor([[116824.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4731576.5000, grad_fn=<MseLossBackward>)
output :  tensor([[64799.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(39679568., grad_fn=<MseLossBackward>)
output :  tensor([[166311.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(97197.8047, grad_fn=<MseLossBackward>)
output :  tensor([[143693.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(13643096., grad_fn=<MseLossBackward>)
output :  tensor([[225785.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(616691.1875, grad_fn=<MseLossBackward>)
output :  tensor([[168555.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(197955.4688, grad_fn=<MseLossBackward>)
output :  tensor([[250682.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(964753.6875, grad_fn=<MseLossBackward>)
output :  tensor([[56411.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(1993677.8750, grad_fn=<MseLossBackward>)
output :  tensor([[160438.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5404e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175564.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(318237., grad_fn=<MseLossBackward>)
output :  tensor([[155104.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1947158.6250, grad_fn=<MseLossBackward>)
output :  tensor([[277515.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6326482.5000, grad_fn=<MseLossBackward>)
output :  tensor([[195463.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2361216.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137294.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5738e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193809.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4769.6289, grad_fn=<MseLossBackward>)
output :  tensor([[179401.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0701e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151048.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2384.1858, grad_fn=<MseLossBackward>)
output :  tensor([[169583.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(173667.5469, grad_fn=<MseLossBackward>)
output :  tensor([[86338.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(880225.1250, grad_fn=<MseLossBackward>)
output :  tensor([[169661.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2106e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184256.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(552141.8750, grad_fn=<MseLossBackward>)
output :  tensor([[206760.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3755e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109802.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(39000.0781, grad_fn=<MseLossBackward>)
output :  tensor([[171104.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(10910.4551, grad_fn=<MseLossBackward>)
output :  tensor([[136103.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(157125.5312, grad_fn=<MseLossBackward>)
output :  tensor([[127906.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(1195281., grad_fn=<MseLossBackward>)
output :  tensor([[119731.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(53780.5078, grad_fn=<MseLossBackward>)
output :  tensor([[145764.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2738e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172064.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0431e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152240.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6452394., grad_fn=<MseLossBackward>)
output :  tensor([[181378.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1901339.3750, grad_fn=<MseLossBackward>)
output :  tensor([[142961.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3846746.7500, grad_fn=<MseLossBackward>)
output :  tensor([[106355.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6751e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136049.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2331e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136158.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1341036.3750, grad_fn=<MseLossBackward>)
output :  tensor([[138131.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2391e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223563.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2063891.3750, grad_fn=<MseLossBackward>)
output :  tensor([[132988.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(546028.6250, grad_fn=<MseLossBackward>)
output :  tensor([[148198.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(642903.3125, grad_fn=<MseLossBackward>)
output :  tensor([[111745.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(64762.2969, grad_fn=<MseLossBackward>)
output :  tensor([[160592.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(351204.3750, grad_fn=<MseLossBackward>)
output :  tensor([[145538.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4465e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192497.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(247179.8750, grad_fn=<MseLossBackward>)
output :  tensor([[134527.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6042.6328, grad_fn=<MseLossBackward>)
output :  tensor([[114193.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(17581642., grad_fn=<MseLossBackward>)
output :  tensor([[235981.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3927457., grad_fn=<MseLossBackward>)
output :  tensor([[165886.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2661e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154109.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(23917908., grad_fn=<MseLossBackward>)
output :  tensor([[203569.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8538e+10, grad_fn=<MseLossBackward>)
output :  tensor([[245164.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1845e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144290.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(625310.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134548.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(301298.0625, grad_fn=<MseLossBackward>)
output :  tensor([[157411.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5813976., grad_fn=<MseLossBackward>)
output :  tensor([[135631.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(31711680., grad_fn=<MseLossBackward>)
output :  tensor([[179951.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4077e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185496.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1950517.7500, grad_fn=<MseLossBackward>)
output :  tensor([[167994.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(42173456., grad_fn=<MseLossBackward>)
output :  tensor([[146804.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(14477312., grad_fn=<MseLossBackward>)
output :  tensor([[140902.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2551457.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140894.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(16852436., grad_fn=<MseLossBackward>)
output :  tensor([[173517.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3783e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192271.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1150e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138540.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4162938.7500, grad_fn=<MseLossBackward>)
output :  tensor([[171204.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(483720.2500, grad_fn=<MseLossBackward>)
output :  tensor([[179313.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2845283.7500, grad_fn=<MseLossBackward>)
output :  tensor([[116685.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2840910.2500, grad_fn=<MseLossBackward>)
output :  tensor([[219243.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3084908., grad_fn=<MseLossBackward>)
output :  tensor([[178465.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(25349808., grad_fn=<MseLossBackward>)
output :  tensor([[131107.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(31448612., grad_fn=<MseLossBackward>)
output :  tensor([[196261.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(56815.1914, grad_fn=<MseLossBackward>)
output :  tensor([[175769.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(756084.6250, grad_fn=<MseLossBackward>)
output :  tensor([[213700.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9773e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209291.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2917637.7500, grad_fn=<MseLossBackward>)
output :  tensor([[167028.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2981e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195975.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2176685.2500, grad_fn=<MseLossBackward>)
output :  tensor([[109933.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9405914., grad_fn=<MseLossBackward>)
output :  tensor([[114833.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5444712., grad_fn=<MseLossBackward>)
output :  tensor([[111401.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(358090.0312, grad_fn=<MseLossBackward>)
output :  tensor([[147619.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(671119.3750, grad_fn=<MseLossBackward>)
output :  tensor([[158194.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4021e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178618.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1907549.3750, grad_fn=<MseLossBackward>)
output :  tensor([[129077.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(2489122.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143524.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2177284.7500, grad_fn=<MseLossBackward>)
output :  tensor([[181266.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1498e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119799.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(8407916., grad_fn=<MseLossBackward>)
output :  tensor([[200340.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(11156226., grad_fn=<MseLossBackward>)
output :  tensor([[142554.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5979629.5000, grad_fn=<MseLossBackward>)
output :  tensor([[213537.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(406266.8125, grad_fn=<MseLossBackward>)
output :  tensor([[125460.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(290857.9688, grad_fn=<MseLossBackward>)
output :  tensor([[244915.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(11642917., grad_fn=<MseLossBackward>)
output :  tensor([[240511.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9792e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145762.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0629e+08, grad_fn=<MseLossBackward>)
output :  tensor([[84745.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6386e+08, grad_fn=<MseLossBackward>)
output :  tensor([[193704.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5927e+09, grad_fn=<MseLossBackward>)
output :  tensor([[86054.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(25552236., grad_fn=<MseLossBackward>)
output :  tensor([[140036.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(287949.6250, grad_fn=<MseLossBackward>)
output :  tensor([[73948.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2406134.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143986.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1067799.2500, grad_fn=<MseLossBackward>)
output :  tensor([[176883.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(780544.6250, grad_fn=<MseLossBackward>)
output :  tensor([[153078.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(177556.8906, grad_fn=<MseLossBackward>)
output :  tensor([[110869.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(12040412., grad_fn=<MseLossBackward>)
output :  tensor([[205434.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2169e+10, grad_fn=<MseLossBackward>)
output :  tensor([[126798.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2895527.7500, grad_fn=<MseLossBackward>)
output :  tensor([[267856.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4747e+08, grad_fn=<MseLossBackward>)
output :  tensor([[301798.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(67262040., grad_fn=<MseLossBackward>)
output :  tensor([[109796.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(5275312., grad_fn=<MseLossBackward>)
output :  tensor([[171076.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2026663.6250, grad_fn=<MseLossBackward>)
output :  tensor([[132362.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9353e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140981.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3925723., grad_fn=<MseLossBackward>)
output :  tensor([[132141.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3578777.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128125.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(9770460., grad_fn=<MseLossBackward>)
output :  tensor([[134851.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4270e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225769.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8900e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191716.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2285e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143721.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(31839.9414, grad_fn=<MseLossBackward>)
output :  tensor([[131416.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(15338483., grad_fn=<MseLossBackward>)
output :  tensor([[112600.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1822626.6250, grad_fn=<MseLossBackward>)
output :  tensor([[255187.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9531e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136616.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2612112.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200275.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7421368., grad_fn=<MseLossBackward>)
output :  tensor([[98060.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(46773736., grad_fn=<MseLossBackward>)
output :  tensor([[141013.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1131431.1250, grad_fn=<MseLossBackward>)
output :  tensor([[207258.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9728e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183063.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(10004668., grad_fn=<MseLossBackward>)
output :  tensor([[185608.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(370785.8438, grad_fn=<MseLossBackward>)
output :  tensor([[160569.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2031e+10, grad_fn=<MseLossBackward>)
output :  tensor([[300665.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1789e+09, grad_fn=<MseLossBackward>)
output :  tensor([[198401.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(251157.5938, grad_fn=<MseLossBackward>)
output :  tensor([[259777.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0473e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222952.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8531e+09, grad_fn=<MseLossBackward>)
output :  tensor([[284607.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0493e+09, grad_fn=<MseLossBackward>)
output :  tensor([[223864.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(18470.5078, grad_fn=<MseLossBackward>)
output :  tensor([[223193.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8496e+10, grad_fn=<MseLossBackward>)
output :  tensor([[198376.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1895182.3750, grad_fn=<MseLossBackward>)
output :  tensor([[158075.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4540e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134114.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2605097., grad_fn=<MseLossBackward>)
output :  tensor([[134525.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(950137.5625, grad_fn=<MseLossBackward>)
output :  tensor([[91582.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(339115.1562, grad_fn=<MseLossBackward>)
output :  tensor([[112011.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(16095643., grad_fn=<MseLossBackward>)
output :  tensor([[270746.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3818e+09, grad_fn=<MseLossBackward>)
output :  tensor([[231309.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(13616561., grad_fn=<MseLossBackward>)
output :  tensor([[144575.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(179974.8125, grad_fn=<MseLossBackward>)
output :  tensor([[136659.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(707254.7500, grad_fn=<MseLossBackward>)
output :  tensor([[173541.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(36618.4102, grad_fn=<MseLossBackward>)
output :  tensor([[147924.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(7152699.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163592.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5529e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166024.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1050561., grad_fn=<MseLossBackward>)
output :  tensor([[137461.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(213011.0938, grad_fn=<MseLossBackward>)
output :  tensor([[187933.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2815e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113058.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1120951.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168462.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(12510922., grad_fn=<MseLossBackward>)
output :  tensor([[119242.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(574327.1250, grad_fn=<MseLossBackward>)
output :  tensor([[86815.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(33950.9414, grad_fn=<MseLossBackward>)
output :  tensor([[178324.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2808661.7500, grad_fn=<MseLossBackward>)
output :  tensor([[108827.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1150725.5000, grad_fn=<MseLossBackward>)
output :  tensor([[237382.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2617367.7500, grad_fn=<MseLossBackward>)
output :  tensor([[246619.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2621211.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128457.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(1087246.1250, grad_fn=<MseLossBackward>)
output :  tensor([[111383.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(5880435.5000, grad_fn=<MseLossBackward>)
output :  tensor([[285801.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2908e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171046.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(206045.0625, grad_fn=<MseLossBackward>)
output :  tensor([[126416.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2005852.6250, grad_fn=<MseLossBackward>)
output :  tensor([[142060.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7889e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202600.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2995e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139408.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2531828., grad_fn=<MseLossBackward>)
output :  tensor([[159766.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4456e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153131.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(591312.9375, grad_fn=<MseLossBackward>)
output :  tensor([[130517.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1035004.1875, grad_fn=<MseLossBackward>)
output :  tensor([[248811.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6819e+10, grad_fn=<MseLossBackward>)
output :  tensor([[392635.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(87695032., grad_fn=<MseLossBackward>)
output :  tensor([[112457.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(11952956., grad_fn=<MseLossBackward>)
output :  tensor([[131283.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6342e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158714.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(616249.5625, grad_fn=<MseLossBackward>)
output :  tensor([[131327.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1402e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163746.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3934e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172607.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9196e+09, grad_fn=<MseLossBackward>)
output :  tensor([[101798.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(3244698.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141481.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(232143.2812, grad_fn=<MseLossBackward>)
output :  tensor([[362742.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(20717006., grad_fn=<MseLossBackward>)
output :  tensor([[206247.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2803e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174556.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(890841., grad_fn=<MseLossBackward>)
output :  tensor([[195945.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(48371372., grad_fn=<MseLossBackward>)
output :  tensor([[142395.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(11527086., grad_fn=<MseLossBackward>)
output :  tensor([[189981.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(20416984., grad_fn=<MseLossBackward>)
output :  tensor([[137423.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9543e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181323.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(104399.6719, grad_fn=<MseLossBackward>)
output :  tensor([[237226.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(22782126., grad_fn=<MseLossBackward>)
output :  tensor([[178419.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(19535296., grad_fn=<MseLossBackward>)
output :  tensor([[105993.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4025227.2500, grad_fn=<MseLossBackward>)
output :  tensor([[263705.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(731078.4375, grad_fn=<MseLossBackward>)
output :  tensor([[253492.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(12199957., grad_fn=<MseLossBackward>)
output :  tensor([[120698.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5298556.5000, grad_fn=<MseLossBackward>)
output :  tensor([[217685.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2850e+09, grad_fn=<MseLossBackward>)
output :  tensor([[302654.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1282e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208702.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2899357.5000, grad_fn=<MseLossBackward>)
output :  tensor([[214862.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5660e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158943.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1089218.3750, grad_fn=<MseLossBackward>)
output :  tensor([[167376.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6832751., grad_fn=<MseLossBackward>)
output :  tensor([[163429.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(42217708., grad_fn=<MseLossBackward>)
output :  tensor([[173632.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(13195056., grad_fn=<MseLossBackward>)
output :  tensor([[234359.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1317e+09, grad_fn=<MseLossBackward>)
output :  tensor([[222061.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(54680016., grad_fn=<MseLossBackward>)
output :  tensor([[160396.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7946e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126323.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(11047937., grad_fn=<MseLossBackward>)
output :  tensor([[176911.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7884.8848, grad_fn=<MseLossBackward>)
output :  tensor([[181885.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1018e+09, grad_fn=<MseLossBackward>)
output :  tensor([[209194.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4382e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135299.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(752881.6250, grad_fn=<MseLossBackward>)
output :  tensor([[151453.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9123e+08, grad_fn=<MseLossBackward>)
output :  tensor([[278070.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1146974.1250, grad_fn=<MseLossBackward>)
output :  tensor([[88937.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(15502553., grad_fn=<MseLossBackward>)
output :  tensor([[235506.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(987259.5625, grad_fn=<MseLossBackward>)
output :  tensor([[258951.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0496e+11, grad_fn=<MseLossBackward>)
output :  tensor([[169904.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(9036.8789, grad_fn=<MseLossBackward>)
output :  tensor([[195194.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5845e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154456.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(295579.0938, grad_fn=<MseLossBackward>)
output :  tensor([[206701.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0067e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128187.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(660880.0625, grad_fn=<MseLossBackward>)
output :  tensor([[145431.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(186151.7969, grad_fn=<MseLossBackward>)
output :  tensor([[169926.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5221e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184939.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(829721.7500, grad_fn=<MseLossBackward>)
output :  tensor([[130405.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(19409118., grad_fn=<MseLossBackward>)
output :  tensor([[137806.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1706289., grad_fn=<MseLossBackward>)
output :  tensor([[175940.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(8649021., grad_fn=<MseLossBackward>)
output :  tensor([[198251.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6779e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239632.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(11339846., grad_fn=<MseLossBackward>)
output :  tensor([[155976.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(953186.1250, grad_fn=<MseLossBackward>)
output :  tensor([[194225.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3149072., grad_fn=<MseLossBackward>)
output :  tensor([[163513.]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8076e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181036.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2362128.7500, grad_fn=<MseLossBackward>)
output :  tensor([[177816.]], grad_fn=<AddmmBackward>)
loss:  tensor(4343056., grad_fn=<MseLossBackward>)
output :  tensor([[95924.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1157137.2500, grad_fn=<MseLossBackward>)
output :  tensor([[171723.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1724e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134455.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(295953., grad_fn=<MseLossBackward>)
output :  tensor([[122176.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(51501592., grad_fn=<MseLossBackward>)
output :  tensor([[176008.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4033319., grad_fn=<MseLossBackward>)
output :  tensor([[86615.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(2609360.7500, grad_fn=<MseLossBackward>)
output :  tensor([[284078.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(35066012., grad_fn=<MseLossBackward>)
output :  tensor([[167223.]], grad_fn=<AddmmBackward>)
loss:  tensor(4941729., grad_fn=<MseLossBackward>)
output :  tensor([[190182.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0445e+10, grad_fn=<MseLossBackward>)
output :  tensor([[246843.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8353e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152373.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1887790.1250, grad_fn=<MseLossBackward>)
output :  tensor([[123251.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(559539.0625, grad_fn=<MseLossBackward>)
output :  tensor([[119346.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(306457.3750, grad_fn=<MseLossBackward>)
output :  tensor([[143269.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9917e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174680.]], grad_fn=<AddmmBackward>)
loss:  tensor(462400., grad_fn=<MseLossBackward>)
output :  tensor([[111216.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2461e+08, grad_fn=<MseLossBackward>)
output :  tensor([[211207.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1405e+10, grad_fn=<MseLossBackward>)
output :  tensor([[232331.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(84069984., grad_fn=<MseLossBackward>)
output :  tensor([[254130.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9898e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221722.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9850e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196445.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4174e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186772.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(529574.5625, grad_fn=<MseLossBackward>)
output :  tensor([[205602.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8078e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190062.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1298e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180911.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4713580., grad_fn=<MseLossBackward>)
output :  tensor([[152508.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(258604.0312, grad_fn=<MseLossBackward>)
output :  tensor([[337807.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(652359.1250, grad_fn=<MseLossBackward>)
output :  tensor([[213355.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1836575.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157695.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5311584.5000, grad_fn=<MseLossBackward>)
output :  tensor([[189569.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6967e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105433.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(187678.4844, grad_fn=<MseLossBackward>)
output :  tensor([[270511.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0934e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174092.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(37164.6094, grad_fn=<MseLossBackward>)
output :  tensor([[205005.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(72152016., grad_fn=<MseLossBackward>)
output :  tensor([[213286.]], grad_fn=<AddmmBackward>)
loss:  tensor(59505796., grad_fn=<MseLossBackward>)
output :  tensor([[178598.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(361557.9375, grad_fn=<MseLossBackward>)
output :  tensor([[202733.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(872210.0625, grad_fn=<MseLossBackward>)
output :  tensor([[155664.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(441601.7812, grad_fn=<MseLossBackward>)
output :  tensor([[146323.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1458e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118300.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(39909.4258, grad_fn=<MseLossBackward>)
output :  tensor([[139614.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(148501.8438, grad_fn=<MseLossBackward>)
output :  tensor([[147700.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1687807., grad_fn=<MseLossBackward>)
output :  tensor([[202364.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5784e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161559.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4242892., grad_fn=<MseLossBackward>)
output :  tensor([[102299.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(7835582., grad_fn=<MseLossBackward>)
output :  tensor([[223513.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7181e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184146.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4771e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177432.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(897193.7500, grad_fn=<MseLossBackward>)
output :  tensor([[81430.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(324632.8750, grad_fn=<MseLossBackward>)
output :  tensor([[129822.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(1750225.6250, grad_fn=<MseLossBackward>)
output :  tensor([[214731.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(535412.3125, grad_fn=<MseLossBackward>)
output :  tensor([[143376.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(388771.7500, grad_fn=<MseLossBackward>)
output :  tensor([[130743.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(553489.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146092.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(12196465., grad_fn=<MseLossBackward>)
output :  tensor([[178813.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7068e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145927.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3716340.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158018.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3927271.2500, grad_fn=<MseLossBackward>)
output :  tensor([[214397.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(363175.7188, grad_fn=<MseLossBackward>)
output :  tensor([[138432.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1177e+09, grad_fn=<MseLossBackward>)
output :  tensor([[259088.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(16713149., grad_fn=<MseLossBackward>)
output :  tensor([[160911.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1992729.2500, grad_fn=<MseLossBackward>)
output :  tensor([[126863.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(2678413.5000, grad_fn=<MseLossBackward>)
output :  tensor([[94968.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(963.9084, grad_fn=<MseLossBackward>)
output :  tensor([[151466.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4845e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178467.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2051429.6250, grad_fn=<MseLossBackward>)
output :  tensor([[121034.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(285481.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191559.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3981e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146802.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5297e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150310.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(168908.1562, grad_fn=<MseLossBackward>)
output :  tensor([[189367.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2614992.2500, grad_fn=<MseLossBackward>)
output :  tensor([[255850.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3858e+09, grad_fn=<MseLossBackward>)
output :  tensor([[92805.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1703065.7500, grad_fn=<MseLossBackward>)
output :  tensor([[232682.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(53539632., grad_fn=<MseLossBackward>)
output :  tensor([[127903.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(356250.4375, grad_fn=<MseLossBackward>)
output :  tensor([[166319.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9163e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114824.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1977e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178287.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(5234157.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163569.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8418e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157342.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2054e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239704.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(496606.5000, grad_fn=<MseLossBackward>)
output :  tensor([[226288.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0056e+09, grad_fn=<MseLossBackward>)
output :  tensor([[126514.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(235422.0781, grad_fn=<MseLossBackward>)
output :  tensor([[122341.]], grad_fn=<AddmmBackward>)
loss:  tensor(13388281., grad_fn=<MseLossBackward>)
output :  tensor([[224124.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8267422., grad_fn=<MseLossBackward>)
output :  tensor([[228708.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(28003114., grad_fn=<MseLossBackward>)
output :  tensor([[229018.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5375587., grad_fn=<MseLossBackward>)
output :  tensor([[147345.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(429004.5312, grad_fn=<MseLossBackward>)
output :  tensor([[214838.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(23409872., grad_fn=<MseLossBackward>)
output :  tensor([[129157.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(83863672., grad_fn=<MseLossBackward>)
output :  tensor([[136259.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(14134898., grad_fn=<MseLossBackward>)
output :  tensor([[315712.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(508146.2188, grad_fn=<MseLossBackward>)
output :  tensor([[143009.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4038592.7500, grad_fn=<MseLossBackward>)
output :  tensor([[121306.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9492e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109786.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(82243.4844, grad_fn=<MseLossBackward>)
output :  tensor([[156123.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6818e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181976.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6023e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175634.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6941496., grad_fn=<MseLossBackward>)
output :  tensor([[193816.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(51602224., grad_fn=<MseLossBackward>)
output :  tensor([[98893.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1224100.2500, grad_fn=<MseLossBackward>)
output :  tensor([[178425.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(330211.8438, grad_fn=<MseLossBackward>)
output :  tensor([[170957.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(9350791., grad_fn=<MseLossBackward>)
output :  tensor([[142251.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(10574285., grad_fn=<MseLossBackward>)
output :  tensor([[262630.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3064e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142478.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3038e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173208.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(43596.1367, grad_fn=<MseLossBackward>)
output :  tensor([[138741.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1584018.8750, grad_fn=<MseLossBackward>)
output :  tensor([[198155.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5498292., grad_fn=<MseLossBackward>)
output :  tensor([[166815.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(10140344., grad_fn=<MseLossBackward>)
output :  tensor([[242725.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1623354.7500, grad_fn=<MseLossBackward>)
output :  tensor([[134894.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(156000.3125, grad_fn=<MseLossBackward>)
output :  tensor([[150407.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1117513.2500, grad_fn=<MseLossBackward>)
output :  tensor([[212458.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6458190., grad_fn=<MseLossBackward>)
output :  tensor([[167434.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5928083.5000, grad_fn=<MseLossBackward>)
output :  tensor([[189506.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(256289.0625, grad_fn=<MseLossBackward>)
output :  tensor([[134350.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0761e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131594.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6730133., grad_fn=<MseLossBackward>)
output :  tensor([[139822.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(31400.9473, grad_fn=<MseLossBackward>)
output :  tensor([[203713.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3279e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164903.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4903e+09, grad_fn=<MseLossBackward>)
output :  tensor([[73298.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7685e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93730.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(85206600., grad_fn=<MseLossBackward>)
output :  tensor([[254316.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1047776.1250, grad_fn=<MseLossBackward>)
output :  tensor([[202468.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0282e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115907.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(823060.0625, grad_fn=<MseLossBackward>)
output :  tensor([[156967.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3226e+08, grad_fn=<MseLossBackward>)
output :  tensor([[205724.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0378e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179754.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1442e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155654.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(428186.1875, grad_fn=<MseLossBackward>)
output :  tensor([[170315.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(99481.1016, grad_fn=<MseLossBackward>)
output :  tensor([[114362.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(405858.5938, grad_fn=<MseLossBackward>)
output :  tensor([[160867.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(34427188., grad_fn=<MseLossBackward>)
output :  tensor([[191386.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4066e+08, grad_fn=<MseLossBackward>)
output :  tensor([[216292.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(10289059., grad_fn=<MseLossBackward>)
output :  tensor([[244488.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5051e+11, grad_fn=<MseLossBackward>)
output :  tensor([[147654.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(427797.7500, grad_fn=<MseLossBackward>)
output :  tensor([[107558.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(849119.0625, grad_fn=<MseLossBackward>)
output :  tensor([[168800.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7159e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153091.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6716844., grad_fn=<MseLossBackward>)
output :  tensor([[234070.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(8580048., grad_fn=<MseLossBackward>)
output :  tensor([[117007.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(4030840.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182571.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(107840.4062, grad_fn=<MseLossBackward>)
output :  tensor([[187347.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(419681.2812, grad_fn=<MseLossBackward>)
output :  tensor([[161660.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5071e+10, grad_fn=<MseLossBackward>)
output :  tensor([[93652.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6010e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239258.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(67072.9062, grad_fn=<MseLossBackward>)
output :  tensor([[175015.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(968655.8125, grad_fn=<MseLossBackward>)
output :  tensor([[140002.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4202, grad_fn=<MseLossBackward>)
output :  tensor([[234344.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(430110.5312, grad_fn=<MseLossBackward>)
output :  tensor([[158139.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(23620208., grad_fn=<MseLossBackward>)
output :  tensor([[202425.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5024e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134243.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(572528.6875, grad_fn=<MseLossBackward>)
output :  tensor([[184910.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2491e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138493.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6216451.5000, grad_fn=<MseLossBackward>)
output :  tensor([[228700.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(53287720., grad_fn=<MseLossBackward>)
output :  tensor([[223174.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1959e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94127.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(17035870., grad_fn=<MseLossBackward>)
output :  tensor([[158919.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(264806.7188, grad_fn=<MseLossBackward>)
output :  tensor([[247964.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5108e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143795.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1450331., grad_fn=<MseLossBackward>)
output :  tensor([[111264.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9593e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165864.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1862457.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143341.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(433416.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128947.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(558394.2500, grad_fn=<MseLossBackward>)
output :  tensor([[189357.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8501e+09, grad_fn=<MseLossBackward>)
output :  tensor([[121748.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(564341.3750, grad_fn=<MseLossBackward>)
output :  tensor([[148698.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(10899077., grad_fn=<MseLossBackward>)
output :  tensor([[169923.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3336844.2500, grad_fn=<MseLossBackward>)
output :  tensor([[151249.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(62024.3477, grad_fn=<MseLossBackward>)
output :  tensor([[158311.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(21053328., grad_fn=<MseLossBackward>)
output :  tensor([[137156.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9279e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130297.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(2900182.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154540.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4151e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146070.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3679143.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163266.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2299156.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139433.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7223e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153008.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(17712918., grad_fn=<MseLossBackward>)
output :  tensor([[188585.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(342993.2500, grad_fn=<MseLossBackward>)
output :  tensor([[168395.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(365099.1875, grad_fn=<MseLossBackward>)
output :  tensor([[178044.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3825324.7500, grad_fn=<MseLossBackward>)
output :  tensor([[219149.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(724014.8750, grad_fn=<MseLossBackward>)
output :  tensor([[111408.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(12311381., grad_fn=<MseLossBackward>)
output :  tensor([[136627.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3754e+08, grad_fn=<MseLossBackward>)
output :  tensor([[285380.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(383470.5625, grad_fn=<MseLossBackward>)
output :  tensor([[114810.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1415133.2500, grad_fn=<MseLossBackward>)
output :  tensor([[176608.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8829e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183193.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3262708.5000, grad_fn=<MseLossBackward>)
output :  tensor([[173813.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3657e+08, grad_fn=<MseLossBackward>)
output :  tensor([[248340.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1073e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223938.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3756570.7500, grad_fn=<MseLossBackward>)
output :  tensor([[126615.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2915e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175064.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8685e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124591.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(349946.1875, grad_fn=<MseLossBackward>)
output :  tensor([[182656.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5599e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149410.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(12887203., grad_fn=<MseLossBackward>)
output :  tensor([[153989.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(56090268., grad_fn=<MseLossBackward>)
output :  tensor([[203144.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9956884., grad_fn=<MseLossBackward>)
output :  tensor([[144559.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4543e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176189.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(36052.5156, grad_fn=<MseLossBackward>)
output :  tensor([[252561.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2567e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147736.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(69539.3359, grad_fn=<MseLossBackward>)
output :  tensor([[204122.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2125035., grad_fn=<MseLossBackward>)
output :  tensor([[157237.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(7357995.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122622.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1987e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136416.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(444659.7500, grad_fn=<MseLossBackward>)
output :  tensor([[181570.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5903381.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194879.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(23805404., grad_fn=<MseLossBackward>)
output :  tensor([[232826.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1554e+09, grad_fn=<MseLossBackward>)
output :  tensor([[254596.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5776136.5000, grad_fn=<MseLossBackward>)
output :  tensor([[187119.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7393e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142655.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6168e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148332.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(14689014., grad_fn=<MseLossBackward>)
output :  tensor([[71614.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9947e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136476.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2179037.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134256.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(28695440., grad_fn=<MseLossBackward>)
output :  tensor([[154547.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(299585.1875, grad_fn=<MseLossBackward>)
output :  tensor([[130146.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(9901347., grad_fn=<MseLossBackward>)
output :  tensor([[74508.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3967877.2500, grad_fn=<MseLossBackward>)
output :  tensor([[82134.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(17966.4707, grad_fn=<MseLossBackward>)
output :  tensor([[227811.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(17539736., grad_fn=<MseLossBackward>)
output :  tensor([[140654.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9269e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127487.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(9073462., grad_fn=<MseLossBackward>)
output :  tensor([[171846.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(23489774., grad_fn=<MseLossBackward>)
output :  tensor([[232194.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7871882.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191117.]], grad_fn=<AddmmBackward>)
loss:  tensor(1046529., grad_fn=<MseLossBackward>)
output :  tensor([[154827.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1373840.3750, grad_fn=<MseLossBackward>)
output :  tensor([[202658.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(22646594., grad_fn=<MseLossBackward>)
output :  tensor([[202440.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1944e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135030.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3879238., grad_fn=<MseLossBackward>)
output :  tensor([[152873.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4522733.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135758.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(58261.8906, grad_fn=<MseLossBackward>)
output :  tensor([[200216.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8705e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152881.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1250413.1250, grad_fn=<MseLossBackward>)
output :  tensor([[139382.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1052e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144470.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(184148.2656, grad_fn=<MseLossBackward>)
output :  tensor([[212383.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(147192.1250, grad_fn=<MseLossBackward>)
output :  tensor([[99864.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1916e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167622.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(15121.3135, grad_fn=<MseLossBackward>)
output :  tensor([[127997.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9532, grad_fn=<MseLossBackward>)
output :  tensor([[147811.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(658430.8125, grad_fn=<MseLossBackward>)
output :  tensor([[105434.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8534e+09, grad_fn=<MseLossBackward>)
output :  tensor([[140412.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8483384., grad_fn=<MseLossBackward>)
output :  tensor([[234282.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2948840.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144593.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(165153.3438, grad_fn=<MseLossBackward>)
output :  tensor([[138962.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2138083.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164419.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3263e+09, grad_fn=<MseLossBackward>)
output :  tensor([[271039.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(48450736., grad_fn=<MseLossBackward>)
output :  tensor([[176377.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1896903.6250, grad_fn=<MseLossBackward>)
output :  tensor([[106686.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(15295677., grad_fn=<MseLossBackward>)
output :  tensor([[202323.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6515e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154897.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(16831404., grad_fn=<MseLossBackward>)
output :  tensor([[164902.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5166e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97245.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1111805.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125154.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2416567.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154646.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1831370.1250, grad_fn=<MseLossBackward>)
output :  tensor([[142283.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5213088., grad_fn=<MseLossBackward>)
output :  tensor([[199084.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(838283.3125, grad_fn=<MseLossBackward>)
output :  tensor([[142348.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(121452.2500, grad_fn=<MseLossBackward>)
output :  tensor([[266422.]], grad_fn=<AddmmBackward>)
loss:  tensor(17156164., grad_fn=<MseLossBackward>)
output :  tensor([[128914.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2899e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163909.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2528199.5000, grad_fn=<MseLossBackward>)
output :  tensor([[188534.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1166.6494, grad_fn=<MseLossBackward>)
output :  tensor([[122538.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5720e+08, grad_fn=<MseLossBackward>)
output :  tensor([[255633.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(31736850., grad_fn=<MseLossBackward>)
output :  tensor([[159252.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6992e+08, grad_fn=<MseLossBackward>)
output :  tensor([[245041.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(95413.4219, grad_fn=<MseLossBackward>)
output :  tensor([[139267.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(22392268., grad_fn=<MseLossBackward>)
output :  tensor([[210112.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(12758.4082, grad_fn=<MseLossBackward>)
output :  tensor([[178569.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(38059644., grad_fn=<MseLossBackward>)
output :  tensor([[154170.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(29235.6562, grad_fn=<MseLossBackward>)
output :  tensor([[118793.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(629196., grad_fn=<MseLossBackward>)
output :  tensor([[239601.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2551e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239606.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(154977.5469, grad_fn=<MseLossBackward>)
output :  tensor([[155450.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4464835., grad_fn=<MseLossBackward>)
output :  tensor([[252816.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4340191., grad_fn=<MseLossBackward>)
output :  tensor([[121956.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(55533236., grad_fn=<MseLossBackward>)
output :  tensor([[175832.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(28066.7188, grad_fn=<MseLossBackward>)
output :  tensor([[156668.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(11099933., grad_fn=<MseLossBackward>)
output :  tensor([[137801.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(46266780., grad_fn=<MseLossBackward>)
output :  tensor([[196388.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4741e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162959.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1083616., grad_fn=<MseLossBackward>)
output :  tensor([[163608.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(370481.4375, grad_fn=<MseLossBackward>)
output :  tensor([[157870.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(16721.7227, grad_fn=<MseLossBackward>)
output :  tensor([[143147.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(45601952., grad_fn=<MseLossBackward>)
output :  tensor([[170220.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6870e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161695.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2873131., grad_fn=<MseLossBackward>)
output :  tensor([[377492.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(41958412., grad_fn=<MseLossBackward>)
output :  tensor([[134599.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(57755488., grad_fn=<MseLossBackward>)
output :  tensor([[131749.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1390e+09, grad_fn=<MseLossBackward>)
output :  tensor([[276308.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(24053508., grad_fn=<MseLossBackward>)
output :  tensor([[161535.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(215905.4375, grad_fn=<MseLossBackward>)
output :  tensor([[129473.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(80525664., grad_fn=<MseLossBackward>)
output :  tensor([[229241.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7607770.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180736.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(55969.2109, grad_fn=<MseLossBackward>)
output :  tensor([[157355.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(28679038., grad_fn=<MseLossBackward>)
output :  tensor([[147690.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(7237865.5000, grad_fn=<MseLossBackward>)
output :  tensor([[156362.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7879e+08, grad_fn=<MseLossBackward>)
output :  tensor([[100393.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(154780.7656, grad_fn=<MseLossBackward>)
output :  tensor([[73807.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9063e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161524.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(12077906., grad_fn=<MseLossBackward>)
output :  tensor([[189866.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4542e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161308.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(10944208., grad_fn=<MseLossBackward>)
output :  tensor([[156945.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(307175.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138784.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1780306.5000, grad_fn=<MseLossBackward>)
output :  tensor([[203251.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7281227.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139288.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1661198.7500, grad_fn=<MseLossBackward>)
output :  tensor([[183329.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6046e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144399.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2562600.7500, grad_fn=<MseLossBackward>)
output :  tensor([[109607.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0798e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96543.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(6469829.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174894.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(11123.6572, grad_fn=<MseLossBackward>)
output :  tensor([[262675.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5176051.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139174.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5409840., grad_fn=<MseLossBackward>)
output :  tensor([[159984.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7959.9854, grad_fn=<MseLossBackward>)
output :  tensor([[132813.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(98017.9141, grad_fn=<MseLossBackward>)
output :  tensor([[148047.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2109620., grad_fn=<MseLossBackward>)
output :  tensor([[166337.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2442871.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128390.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(1934076.8750, grad_fn=<MseLossBackward>)
output :  tensor([[172832.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7465e+08, grad_fn=<MseLossBackward>)
output :  tensor([[159038.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4156119.2500, grad_fn=<MseLossBackward>)
output :  tensor([[119520.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(9125639., grad_fn=<MseLossBackward>)
output :  tensor([[161286.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1428e+09, grad_fn=<MseLossBackward>)
output :  tensor([[55011.4258]], grad_fn=<AddmmBackward>)
loss:  tensor(9068685., grad_fn=<MseLossBackward>)
output :  tensor([[233983.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1648e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201488.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(238952.9375, grad_fn=<MseLossBackward>)
output :  tensor([[182968.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4128389., grad_fn=<MseLossBackward>)
output :  tensor([[107132.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(1281937., grad_fn=<MseLossBackward>)
output :  tensor([[88459.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2129045.7500, grad_fn=<MseLossBackward>)
output :  tensor([[139246.]], grad_fn=<AddmmBackward>)
loss:  tensor(568516., grad_fn=<MseLossBackward>)
output :  tensor([[222325.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1372e+09, grad_fn=<MseLossBackward>)
output :  tensor([[204970.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6400663., grad_fn=<MseLossBackward>)
output :  tensor([[167235.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4999277., grad_fn=<MseLossBackward>)
output :  tensor([[175270.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0513e+09, grad_fn=<MseLossBackward>)
output :  tensor([[188289.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2927360.5000, grad_fn=<MseLossBackward>)
output :  tensor([[91920.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(24209476., grad_fn=<MseLossBackward>)
output :  tensor([[139584.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(172783.1094, grad_fn=<MseLossBackward>)
output :  tensor([[112053.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2413556.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147591.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3530e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173991.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8483e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194052.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1984e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181604.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2574019.2500, grad_fn=<MseLossBackward>)
output :  tensor([[96125.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(140519.5469, grad_fn=<MseLossBackward>)
output :  tensor([[119394.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3587413.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162083.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8035e+08, grad_fn=<MseLossBackward>)
output :  tensor([[201196.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1430715., grad_fn=<MseLossBackward>)
output :  tensor([[146553.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6522277.5000, grad_fn=<MseLossBackward>)
train_loss: [2.5922857e+09]
epoch_result tensor([0.])
output :  tensor([[158236.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(69242.9922, grad_fn=<MseLossBackward>)
output :  tensor([[121291.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(502658.8438, grad_fn=<MseLossBackward>)
output :  tensor([[195449.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1559103.3750, grad_fn=<MseLossBackward>)
output :  tensor([[175055.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3780472.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152581.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4610e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128492.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(242087.0625, grad_fn=<MseLossBackward>)
output :  tensor([[140416.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(340217.0312, grad_fn=<MseLossBackward>)
output :  tensor([[120067.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1140590.6250, grad_fn=<MseLossBackward>)
output :  tensor([[66927.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(71019592., grad_fn=<MseLossBackward>)
output :  tensor([[165980.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(377.8164, grad_fn=<MseLossBackward>)
output :  tensor([[145812.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(33788424., grad_fn=<MseLossBackward>)
output :  tensor([[225354.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(125847.5625, grad_fn=<MseLossBackward>)
output :  tensor([[168593.]], grad_fn=<AddmmBackward>)
loss:  tensor(165649., grad_fn=<MseLossBackward>)
output :  tensor([[246126.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(12770014., grad_fn=<MseLossBackward>)
output :  tensor([[53916.4180]], grad_fn=<AddmmBackward>)
loss:  tensor(1174150., grad_fn=<MseLossBackward>)
output :  tensor([[162237.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1462e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168230.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(45832264., grad_fn=<MseLossBackward>)
output :  tensor([[167332.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1733e+08, grad_fn=<MseLossBackward>)
output :  tensor([[273034.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3862330.5000, grad_fn=<MseLossBackward>)
output :  tensor([[197197.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(39086.5273, grad_fn=<MseLossBackward>)
output :  tensor([[138944.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4832e+10, grad_fn=<MseLossBackward>)
output :  tensor([[197103.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(10397703., grad_fn=<MseLossBackward>)
output :  tensor([[179715.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0417e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150179.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(673861.4375, grad_fn=<MseLossBackward>)
output :  tensor([[177551.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(57024680., grad_fn=<MseLossBackward>)
output :  tensor([[83234.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(4691387., grad_fn=<MseLossBackward>)
output :  tensor([[171051.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3700e+09, grad_fn=<MseLossBackward>)
output :  tensor([[188394.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(11519872., grad_fn=<MseLossBackward>)
output :  tensor([[207569.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2974e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111431.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(2048096.3750, grad_fn=<MseLossBackward>)
output :  tensor([[170511.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(238510.1406, grad_fn=<MseLossBackward>)
output :  tensor([[139594.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(9578735., grad_fn=<MseLossBackward>)
output :  tensor([[130223.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1497793.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120764.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(1598703.3750, grad_fn=<MseLossBackward>)
output :  tensor([[147914.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5570e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168600.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1433e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151168.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2156354.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182260.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(5109860., grad_fn=<MseLossBackward>)
output :  tensor([[144016.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(9098612., grad_fn=<MseLossBackward>)
output :  tensor([[106905.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8580e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136610.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1449e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129808.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(26954350., grad_fn=<MseLossBackward>)
output :  tensor([[137496.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1017e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226669.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2785926., grad_fn=<MseLossBackward>)
output :  tensor([[132320.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4915.3242, grad_fn=<MseLossBackward>)
output :  tensor([[152139.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(9856951., grad_fn=<MseLossBackward>)
output :  tensor([[116872.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(23738668., grad_fn=<MseLossBackward>)
output :  tensor([[159544.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(207238.3438, grad_fn=<MseLossBackward>)
output :  tensor([[146701.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3328e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193457.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2123577.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136347.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3602107.5000, grad_fn=<MseLossBackward>)
output :  tensor([[98915.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2286e+08, grad_fn=<MseLossBackward>)
output :  tensor([[230964.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(9214640., grad_fn=<MseLossBackward>)
output :  tensor([[165737.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2803e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159326.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(106357.5156, grad_fn=<MseLossBackward>)
output :  tensor([[204655.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8172e+10, grad_fn=<MseLossBackward>)
output :  tensor([[244394.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2013e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143552.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2782.5625, grad_fn=<MseLossBackward>)
output :  tensor([[135905.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3631228., grad_fn=<MseLossBackward>)
output :  tensor([[154392.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(368923.3750, grad_fn=<MseLossBackward>)
output :  tensor([[132796.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7818839.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179785.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4343e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181960.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4579265.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165599.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(16807950., grad_fn=<MseLossBackward>)
output :  tensor([[135244.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(60150688., grad_fn=<MseLossBackward>)
output :  tensor([[141916.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(340344.6250, grad_fn=<MseLossBackward>)
output :  tensor([[147255.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5089113., grad_fn=<MseLossBackward>)
output :  tensor([[173303.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4066e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195616.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5727e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139729.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(10426542., grad_fn=<MseLossBackward>)
output :  tensor([[178595.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(44828676., grad_fn=<MseLossBackward>)
output :  tensor([[176092.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(24081410., grad_fn=<MseLossBackward>)
output :  tensor([[116261.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1591540., grad_fn=<MseLossBackward>)
output :  tensor([[215696.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(28123300., grad_fn=<MseLossBackward>)
output :  tensor([[184842.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1801844.7500, grad_fn=<MseLossBackward>)
output :  tensor([[125223.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(76413.3750, grad_fn=<MseLossBackward>)
output :  tensor([[198082.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2503218.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176342.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2081257., grad_fn=<MseLossBackward>)
output :  tensor([[209915.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1094e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209547.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2109756.2500, grad_fn=<MseLossBackward>)
output :  tensor([[165410.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1841e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192714.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3187842.7500, grad_fn=<MseLossBackward>)
output :  tensor([[113440.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(194377.6562, grad_fn=<MseLossBackward>)
output :  tensor([[116246.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(14039541., grad_fn=<MseLossBackward>)
output :  tensor([[112507.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(257445.2500, grad_fn=<MseLossBackward>)
output :  tensor([[146444.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(126502.4844, grad_fn=<MseLossBackward>)
output :  tensor([[160280.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3256e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180005.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(33.2424, grad_fn=<MseLossBackward>)
output :  tensor([[126420.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1165893.7500, grad_fn=<MseLossBackward>)
output :  tensor([[145067.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4562.5801, grad_fn=<MseLossBackward>)
output :  tensor([[182559.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2714e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117100.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(40150.1406, grad_fn=<MseLossBackward>)
output :  tensor([[192924.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(16606134., grad_fn=<MseLossBackward>)
output :  tensor([[146974.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3898835.2500, grad_fn=<MseLossBackward>)
output :  tensor([[209346.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(12625586., grad_fn=<MseLossBackward>)
output :  tensor([[127552.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(2411008.2500, grad_fn=<MseLossBackward>)
output :  tensor([[249568.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1539576.8750, grad_fn=<MseLossBackward>)
output :  tensor([[241305.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9092e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147321.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5349e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85303.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9067e+08, grad_fn=<MseLossBackward>)
output :  tensor([[193980.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5480e+09, grad_fn=<MseLossBackward>)
output :  tensor([[79798.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(1443921.3750, grad_fn=<MseLossBackward>)
output :  tensor([[139372.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(16300.1074, grad_fn=<MseLossBackward>)
output :  tensor([[76890.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1934011.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142584.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(135700.1406, grad_fn=<MseLossBackward>)
output :  tensor([[175066.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(871130.5625, grad_fn=<MseLossBackward>)
output :  tensor([[154245.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(555420.8750, grad_fn=<MseLossBackward>)
output :  tensor([[108650.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(1563496.2500, grad_fn=<MseLossBackward>)
output :  tensor([[205551.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2144e+10, grad_fn=<MseLossBackward>)
output :  tensor([[127570.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(864696.5625, grad_fn=<MseLossBackward>)
output :  tensor([[267339.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6030e+08, grad_fn=<MseLossBackward>)
output :  tensor([[301427.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(73493112., grad_fn=<MseLossBackward>)
output :  tensor([[107936.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(190150.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170361.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4572714.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134049.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7857e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128024.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2047e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129135.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(1242127.6250, grad_fn=<MseLossBackward>)
output :  tensor([[126983.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(3934241.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134863.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4332e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226437.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8637e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190945.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2516e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145205.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1704085.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126053.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(2093696., grad_fn=<MseLossBackward>)
output :  tensor([[111480.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(53281.6250, grad_fn=<MseLossBackward>)
output :  tensor([[257354.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6852e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135902.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(814703.6875, grad_fn=<MseLossBackward>)
output :  tensor([[206034.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(9209992., grad_fn=<MseLossBackward>)
output :  tensor([[103694.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(1454266.3750, grad_fn=<MseLossBackward>)
output :  tensor([[138409.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2371744.5000, grad_fn=<MseLossBackward>)
output :  tensor([[209384.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2848e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179419.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(230790.1719, grad_fn=<MseLossBackward>)
output :  tensor([[184876.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(15252.2500, grad_fn=<MseLossBackward>)
output :  tensor([[161520.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1750e+10, grad_fn=<MseLossBackward>)
output :  tensor([[300573.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1852e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196976.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(853545., grad_fn=<MseLossBackward>)
output :  tensor([[261594.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9956e+10, grad_fn=<MseLossBackward>)
output :  tensor([[219800.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1344e+09, grad_fn=<MseLossBackward>)
output :  tensor([[285567.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8802e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224899.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(808959.6875, grad_fn=<MseLossBackward>)
output :  tensor([[223282.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8466e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196727.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(74315.8750, grad_fn=<MseLossBackward>)
output :  tensor([[160075.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6569e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131971.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(279527., grad_fn=<MseLossBackward>)
output :  tensor([[136591.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1190997.1250, grad_fn=<MseLossBackward>)
output :  tensor([[90381.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(383044.9375, grad_fn=<MseLossBackward>)
output :  tensor([[108507.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(257564.1875, grad_fn=<MseLossBackward>)
output :  tensor([[272634.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1658e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236939.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3760569.2500, grad_fn=<MseLossBackward>)
output :  tensor([[146313.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1724625.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138152.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(425328.1562, grad_fn=<MseLossBackward>)
output :  tensor([[171098.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6942813.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146266.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1032287.7500, grad_fn=<MseLossBackward>)
output :  tensor([[166117.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0554e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165932.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(869672.8125, grad_fn=<MseLossBackward>)
output :  tensor([[135126.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3510002.2500, grad_fn=<MseLossBackward>)
output :  tensor([[189725.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5192e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113970.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3884779.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168894.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(9644518., grad_fn=<MseLossBackward>)
output :  tensor([[122316.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(5367439., grad_fn=<MseLossBackward>)
output :  tensor([[91840.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(23435130., grad_fn=<MseLossBackward>)
output :  tensor([[181078.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1162825.2500, grad_fn=<MseLossBackward>)
output :  tensor([[111933.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(4136933.5000, grad_fn=<MseLossBackward>)
output :  tensor([[240391.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1937446.5000, grad_fn=<MseLossBackward>)
output :  tensor([[249924.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(24251008., grad_fn=<MseLossBackward>)
output :  tensor([[132087.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6694105., grad_fn=<MseLossBackward>)
output :  tensor([[106126.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(8021640., grad_fn=<MseLossBackward>)
output :  tensor([[291852.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1113e+10, grad_fn=<MseLossBackward>)
output :  tensor([[173759.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5104705., grad_fn=<MseLossBackward>)
output :  tensor([[125906.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(821487.3125, grad_fn=<MseLossBackward>)
output :  tensor([[144588.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0697e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202159.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4020e+08, grad_fn=<MseLossBackward>)
output :  tensor([[143879.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(8289271., grad_fn=<MseLossBackward>)
output :  tensor([[156089.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5354e+10, grad_fn=<MseLossBackward>)
output :  tensor([[156888.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(8933280., grad_fn=<MseLossBackward>)
output :  tensor([[128996.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(253433.5781, grad_fn=<MseLossBackward>)
output :  tensor([[249601.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6615e+10, grad_fn=<MseLossBackward>)
output :  tensor([[400385.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2607316.7500, grad_fn=<MseLossBackward>)
output :  tensor([[110090.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(1189411.7500, grad_fn=<MseLossBackward>)
output :  tensor([[119597.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1204129., grad_fn=<MseLossBackward>)
output :  tensor([[156910.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6705510., grad_fn=<MseLossBackward>)
output :  tensor([[131034.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2741e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160608.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7690e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171257.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7524e+09, grad_fn=<MseLossBackward>)
output :  tensor([[104971.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(1881162.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138057.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8659778., grad_fn=<MseLossBackward>)
output :  tensor([[366675.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(382001.2500, grad_fn=<MseLossBackward>)
output :  tensor([[206174.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2873e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173890.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2589434., grad_fn=<MseLossBackward>)
output :  tensor([[203602.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(493462.3438, grad_fn=<MseLossBackward>)
output :  tensor([[137123.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3521252.2500, grad_fn=<MseLossBackward>)
output :  tensor([[193816.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(466681.1250, grad_fn=<MseLossBackward>)
output :  tensor([[134867.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4897e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176247.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(22590266., grad_fn=<MseLossBackward>)
output :  tensor([[240750.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1562148.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172273.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2982367., grad_fn=<MseLossBackward>)
output :  tensor([[111260.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(10633459., grad_fn=<MseLossBackward>)
output :  tensor([[265762.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1444728.8750, grad_fn=<MseLossBackward>)
output :  tensor([[251914.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3666686.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121585.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(2002114.5000, grad_fn=<MseLossBackward>)
output :  tensor([[213765.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7496e+09, grad_fn=<MseLossBackward>)
output :  tensor([[306262.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6244e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206649.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(122653.1719, grad_fn=<MseLossBackward>)
output :  tensor([[216230.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5319e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158584.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(469010.9688, grad_fn=<MseLossBackward>)
output :  tensor([[169026.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(927760.2500, grad_fn=<MseLossBackward>)
output :  tensor([[160563.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(13191084., grad_fn=<MseLossBackward>)
output :  tensor([[166421.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(12806445., grad_fn=<MseLossBackward>)
output :  tensor([[237108.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5429e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222013.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(55386852., grad_fn=<MseLossBackward>)
output :  tensor([[161777.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1838e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123463.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(214803.2812, grad_fn=<MseLossBackward>)
output :  tensor([[178852.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3431293.2500, grad_fn=<MseLossBackward>)
output :  tensor([[178155.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6986e+09, grad_fn=<MseLossBackward>)
output :  tensor([[209906.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4118e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135005.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(328436.4375, grad_fn=<MseLossBackward>)
output :  tensor([[150153.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1531e+08, grad_fn=<MseLossBackward>)
output :  tensor([[278108.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1228495.1250, grad_fn=<MseLossBackward>)
output :  tensor([[88531.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(12469451., grad_fn=<MseLossBackward>)
output :  tensor([[234556.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3778650., grad_fn=<MseLossBackward>)
output :  tensor([[255646.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0712e+11, grad_fn=<MseLossBackward>)
output :  tensor([[169879.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(14501.4277, grad_fn=<MseLossBackward>)
output :  tensor([[195146.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5883e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153415.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2512126., grad_fn=<MseLossBackward>)
output :  tensor([[206108.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0821e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130488.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2216981.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146767.]], grad_fn=<AddmmBackward>)
loss:  tensor(3122289., grad_fn=<MseLossBackward>)
output :  tensor([[168343.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6789e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186494.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(415138.5938, grad_fn=<MseLossBackward>)
output :  tensor([[127070.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(1146522.2500, grad_fn=<MseLossBackward>)
output :  tensor([[136926.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(182315.6562, grad_fn=<MseLossBackward>)
output :  tensor([[169932.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(9412241., grad_fn=<MseLossBackward>)
output :  tensor([[197814.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7234e+09, grad_fn=<MseLossBackward>)
output :  tensor([[241168.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3354449.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154354.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(416125.7812, grad_fn=<MseLossBackward>)
output :  tensor([[204748.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(76535704., grad_fn=<MseLossBackward>)
output :  tensor([[162897.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5712e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183330.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(14669977., grad_fn=<MseLossBackward>)
output :  tensor([[179040.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(739519.3750, grad_fn=<MseLossBackward>)
output :  tensor([[99685.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(7211155., grad_fn=<MseLossBackward>)
output :  tensor([[172935.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1463e+10, grad_fn=<MseLossBackward>)
output :  tensor([[137768.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(7663813.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120565.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(30970704., grad_fn=<MseLossBackward>)
output :  tensor([[171191.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(7885390.5000, grad_fn=<MseLossBackward>)
output :  tensor([[84633.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(134574.3438, grad_fn=<MseLossBackward>)
output :  tensor([[285601.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(19348726., grad_fn=<MseLossBackward>)
output :  tensor([[167312.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5348017.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191796.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9986e+10, grad_fn=<MseLossBackward>)
output :  tensor([[249523.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6124e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151002.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4932, grad_fn=<MseLossBackward>)
output :  tensor([[122924.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1157540.6250, grad_fn=<MseLossBackward>)
output :  tensor([[127563.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(58731028., grad_fn=<MseLossBackward>)
output :  tensor([[146181.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7227e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173643.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(127103.3906, grad_fn=<MseLossBackward>)
output :  tensor([[112919.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2534e+08, grad_fn=<MseLossBackward>)
output :  tensor([[212217.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1190e+10, grad_fn=<MseLossBackward>)
output :  tensor([[237024.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(20032338., grad_fn=<MseLossBackward>)
output :  tensor([[251906.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0531e+10, grad_fn=<MseLossBackward>)
output :  tensor([[219553.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7815e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195148.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4484e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189649.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4619544., grad_fn=<MseLossBackward>)
output :  tensor([[206954.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7487e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191489.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0883e+10, grad_fn=<MseLossBackward>)
output :  tensor([[175334.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(11599452., grad_fn=<MseLossBackward>)
output :  tensor([[153196.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1432135.7500, grad_fn=<MseLossBackward>)
output :  tensor([[331592.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(29240042., grad_fn=<MseLossBackward>)
output :  tensor([[213131.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1279903.3750, grad_fn=<MseLossBackward>)
output :  tensor([[162672.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(7141755., grad_fn=<MseLossBackward>)
output :  tensor([[187970.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8654e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107775.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(7701535.5000, grad_fn=<MseLossBackward>)
output :  tensor([[273571.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9202e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170273.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(13150256., grad_fn=<MseLossBackward>)
output :  tensor([[210610.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(8350474.5000, grad_fn=<MseLossBackward>)
output :  tensor([[212575.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(70965880., grad_fn=<MseLossBackward>)
output :  tensor([[181747.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6492145., grad_fn=<MseLossBackward>)
output :  tensor([[201066.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(537793.0625, grad_fn=<MseLossBackward>)
output :  tensor([[157757.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7601135., grad_fn=<MseLossBackward>)
output :  tensor([[149066.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4075e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120956.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(6035121.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140402.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(161893.0625, grad_fn=<MseLossBackward>)
output :  tensor([[147202.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3231961.2500, grad_fn=<MseLossBackward>)
output :  tensor([[201321.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6047e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159614.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(13203.4463, grad_fn=<MseLossBackward>)
output :  tensor([[101211.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2928109.2500, grad_fn=<MseLossBackward>)
output :  tensor([[226346.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8642e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185445.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9784e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176479.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(35.6260, grad_fn=<MseLossBackward>)
output :  tensor([[87831.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(34009580., grad_fn=<MseLossBackward>)
output :  tensor([[129926.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2035838.5000, grad_fn=<MseLossBackward>)
output :  tensor([[214594.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(353244.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141769.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4976385., grad_fn=<MseLossBackward>)
output :  tensor([[127980.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4078569.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145290.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(7236772.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176926.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5544e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144928.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(862315.3750, grad_fn=<MseLossBackward>)
output :  tensor([[160704.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(496320.2500, grad_fn=<MseLossBackward>)
output :  tensor([[214663.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(113347.9531, grad_fn=<MseLossBackward>)
output :  tensor([[135549.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3325e+08, grad_fn=<MseLossBackward>)
output :  tensor([[257974.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(8847093., grad_fn=<MseLossBackward>)
output :  tensor([[156989.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6304650., grad_fn=<MseLossBackward>)
output :  tensor([[131046.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6487129.5000, grad_fn=<MseLossBackward>)
output :  tensor([[95369.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(136207.1250, grad_fn=<MseLossBackward>)
output :  tensor([[157497.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3286e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180337.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(191748.2031, grad_fn=<MseLossBackward>)
output :  tensor([[118871.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2652012.2500, grad_fn=<MseLossBackward>)
output :  tensor([[189389.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5650e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144731.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2551e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149233.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(444368.0625, grad_fn=<MseLossBackward>)
output :  tensor([[187504.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(60285.5938, grad_fn=<MseLossBackward>)
output :  tensor([[251793.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7043e+09, grad_fn=<MseLossBackward>)
output :  tensor([[88238.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(10638503., grad_fn=<MseLossBackward>)
output :  tensor([[242254.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5084320.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131080.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6656561.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165818.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0016e+10, grad_fn=<MseLossBackward>)
output :  tensor([[112890.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6616e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172292.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(13746599., grad_fn=<MseLossBackward>)
output :  tensor([[162919.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5316e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150970.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1902e+08, grad_fn=<MseLossBackward>)
output :  tensor([[233092.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(34893756., grad_fn=<MseLossBackward>)
output :  tensor([[224637.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1131e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128362.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(1857449.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129192.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(10194900., grad_fn=<MseLossBackward>)
output :  tensor([[227963.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(928783.9375, grad_fn=<MseLossBackward>)
output :  tensor([[229583.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(19505472., grad_fn=<MseLossBackward>)
output :  tensor([[226838.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(19173.5938, grad_fn=<MseLossBackward>)
output :  tensor([[147603.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(157224.6406, grad_fn=<MseLossBackward>)
output :  tensor([[212717.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7386505., grad_fn=<MseLossBackward>)
output :  tensor([[132091.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4619e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130626.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3510002.2500, grad_fn=<MseLossBackward>)
output :  tensor([[308396.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(43611576., grad_fn=<MseLossBackward>)
output :  tensor([[137593.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(11605413., grad_fn=<MseLossBackward>)
output :  tensor([[120598.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8728e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109446.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2868.9414, grad_fn=<MseLossBackward>)
output :  tensor([[155488.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8939e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180451.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8875e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171329.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2789056.5000, grad_fn=<MseLossBackward>)
output :  tensor([[193987.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(49169240., grad_fn=<MseLossBackward>)
output :  tensor([[106677.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(44586816., grad_fn=<MseLossBackward>)
output :  tensor([[180219.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1486646.7500, grad_fn=<MseLossBackward>)
output :  tensor([[170963.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(9387330., grad_fn=<MseLossBackward>)
output :  tensor([[137664.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1782266.7500, grad_fn=<MseLossBackward>)
output :  tensor([[257903.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0241e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141753.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2209e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175391.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5718525., grad_fn=<MseLossBackward>)
output :  tensor([[140917.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(840917.6875, grad_fn=<MseLossBackward>)
output :  tensor([[198916.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2509006.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168189.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3278306.2500, grad_fn=<MseLossBackward>)
output :  tensor([[241318.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7192034.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131369.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(9797683., grad_fn=<MseLossBackward>)
output :  tensor([[150495.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1311526., grad_fn=<MseLossBackward>)
output :  tensor([[211260.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(13983276., grad_fn=<MseLossBackward>)
output :  tensor([[165398.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(159088.7969, grad_fn=<MseLossBackward>)
output :  tensor([[185677.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(11041394., grad_fn=<MseLossBackward>)
output :  tensor([[133825.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3375e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129023.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(535.1270, grad_fn=<MseLossBackward>)
output :  tensor([[146547.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(42864640., grad_fn=<MseLossBackward>)
output :  tensor([[202444.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4964e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165034.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5035e+09, grad_fn=<MseLossBackward>)
output :  tensor([[74780.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1847e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94218.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(94448936., grad_fn=<MseLossBackward>)
output :  tensor([[246652.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(44101012., grad_fn=<MseLossBackward>)
output :  tensor([[203850.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2056e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115483.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(233772.2500, grad_fn=<MseLossBackward>)
output :  tensor([[162575.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2124e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207390.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5900e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181135.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8968e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159876.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(23778424., grad_fn=<MseLossBackward>)
output :  tensor([[168488.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2284679.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117429.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(5904786., grad_fn=<MseLossBackward>)
output :  tensor([[160635.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(31755338., grad_fn=<MseLossBackward>)
output :  tensor([[193273.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8567e+08, grad_fn=<MseLossBackward>)
output :  tensor([[217092.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5798238.5000, grad_fn=<MseLossBackward>)
output :  tensor([[242542.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5246e+11, grad_fn=<MseLossBackward>)
output :  tensor([[146391.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(369759., grad_fn=<MseLossBackward>)
output :  tensor([[108810.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(109545.4844, grad_fn=<MseLossBackward>)
output :  tensor([[169189.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6155e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151353.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(728435.5625, grad_fn=<MseLossBackward>)
output :  tensor([[236023.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(954498.5000, grad_fn=<MseLossBackward>)
output :  tensor([[116076.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1159390.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179182.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(13823292., grad_fn=<MseLossBackward>)
output :  tensor([[183568.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(9803455., grad_fn=<MseLossBackward>)
output :  tensor([[162670.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4753e+10, grad_fn=<MseLossBackward>)
output :  tensor([[94270.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7610e+08, grad_fn=<MseLossBackward>)
output :  tensor([[232892.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(37304036., grad_fn=<MseLossBackward>)
output :  tensor([[176641.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(410981.1562, grad_fn=<MseLossBackward>)
output :  tensor([[141212.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1470080.5000, grad_fn=<MseLossBackward>)
output :  tensor([[236996.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3986386.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165413.]], grad_fn=<AddmmBackward>)
loss:  tensor(5822569., grad_fn=<MseLossBackward>)
output :  tensor([[206003.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4160e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135652.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(425368.9062, grad_fn=<MseLossBackward>)
output :  tensor([[186609.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0561e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136700.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(490393.8438, grad_fn=<MseLossBackward>)
output :  tensor([[225970.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0059e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227898.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8849e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93465.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(12011315., grad_fn=<MseLossBackward>)
output :  tensor([[162951.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(12373246., grad_fn=<MseLossBackward>)
output :  tensor([[246453.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5482e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145488.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(238159.2500, grad_fn=<MseLossBackward>)
output :  tensor([[109567.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8120e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162223.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5183875., grad_fn=<MseLossBackward>)
output :  tensor([[145885.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3554874.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127528.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(450796.8438, grad_fn=<MseLossBackward>)
output :  tensor([[189332.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8535e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124676.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4738921., grad_fn=<MseLossBackward>)
output :  tensor([[150506.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2229095.7500, grad_fn=<MseLossBackward>)
output :  tensor([[167834.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(15329794., grad_fn=<MseLossBackward>)
output :  tensor([[147747.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(10578350., grad_fn=<MseLossBackward>)
output :  tensor([[161488.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1990965.1250, grad_fn=<MseLossBackward>)
output :  tensor([[134215.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3583e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133126.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1269319.1250, grad_fn=<MseLossBackward>)
output :  tensor([[153544.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1154e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145938.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3192699., grad_fn=<MseLossBackward>)
output :  tensor([[163353.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2570460.7500, grad_fn=<MseLossBackward>)
output :  tensor([[134349.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9778e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148008.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(627090.7500, grad_fn=<MseLossBackward>)
output :  tensor([[183130.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(23709596., grad_fn=<MseLossBackward>)
output :  tensor([[169756.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(571937.6875, grad_fn=<MseLossBackward>)
output :  tensor([[180827.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(684626.9375, grad_fn=<MseLossBackward>)
output :  tensor([[218894.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1222786.7500, grad_fn=<MseLossBackward>)
output :  tensor([[112000.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(16813204., grad_fn=<MseLossBackward>)
output :  tensor([[135764.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1803e+08, grad_fn=<MseLossBackward>)
output :  tensor([[287047.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1097911., grad_fn=<MseLossBackward>)
output :  tensor([[118705.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(7320322., grad_fn=<MseLossBackward>)
output :  tensor([[177006.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8484e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186887.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3562243.2500, grad_fn=<MseLossBackward>)
output :  tensor([[181288.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(17736206., grad_fn=<MseLossBackward>)
output :  tensor([[248525.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0090e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219212.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7767978.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124138.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3265e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176021.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3000e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122451.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2398384.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180649.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6631e+10, grad_fn=<MseLossBackward>)
output :  tensor([[148234.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(22705672., grad_fn=<MseLossBackward>)
output :  tensor([[153164.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(44413268., grad_fn=<MseLossBackward>)
output :  tensor([[204347.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3810365., grad_fn=<MseLossBackward>)
output :  tensor([[145805.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7704e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173804.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4822347.5000, grad_fn=<MseLossBackward>)
output :  tensor([[252612.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2296e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147472.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(278173.8438, grad_fn=<MseLossBackward>)
output :  tensor([[202625.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1575.0977, grad_fn=<MseLossBackward>)
output :  tensor([[165532.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(31169016., grad_fn=<MseLossBackward>)
output :  tensor([[122045.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1591e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133841.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3644042.5000, grad_fn=<MseLossBackward>)
output :  tensor([[181054.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(8673485., grad_fn=<MseLossBackward>)
output :  tensor([[197212.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(52018804., grad_fn=<MseLossBackward>)
output :  tensor([[234509.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9692e+09, grad_fn=<MseLossBackward>)
output :  tensor([[253475.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(12419127., grad_fn=<MseLossBackward>)
output :  tensor([[188790.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6954e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141654.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5154e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147836.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(11133588., grad_fn=<MseLossBackward>)
output :  tensor([[71544.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9506e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126459.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(72938272., grad_fn=<MseLossBackward>)
output :  tensor([[130978.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(4321948.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153630.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(136207.1250, grad_fn=<MseLossBackward>)
output :  tensor([[129853.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(8144602.5000, grad_fn=<MseLossBackward>)
output :  tensor([[78140.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2690676.2500, grad_fn=<MseLossBackward>)
output :  tensor([[84022.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(4092371., grad_fn=<MseLossBackward>)
output :  tensor([[240559.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(73258088., grad_fn=<MseLossBackward>)
output :  tensor([[139021.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0339e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130326.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(30037.2227, grad_fn=<MseLossBackward>)
output :  tensor([[170147.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(9909117., grad_fn=<MseLossBackward>)
output :  tensor([[235047.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2256.2500, grad_fn=<MseLossBackward>)
output :  tensor([[191676.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(214658.4688, grad_fn=<MseLossBackward>)
output :  tensor([[152713.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(10801082., grad_fn=<MseLossBackward>)
output :  tensor([[196544.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1836109.7500, grad_fn=<MseLossBackward>)
output :  tensor([[205153.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0142e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135239.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3098095., grad_fn=<MseLossBackward>)
output :  tensor([[154233.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(587186.9375, grad_fn=<MseLossBackward>)
output :  tensor([[137438.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2068563., grad_fn=<MseLossBackward>)
output :  tensor([[199961.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0230e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157043.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(9264985., grad_fn=<MseLossBackward>)
output :  tensor([[137291.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9177e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151588.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(44731852., grad_fn=<MseLossBackward>)
output :  tensor([[203983.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(64257760., grad_fn=<MseLossBackward>)
output :  tensor([[99681.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1262e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165695.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3257348.2500, grad_fn=<MseLossBackward>)
output :  tensor([[131878.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(15041429., grad_fn=<MseLossBackward>)
output :  tensor([[145119.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3535046.2500, grad_fn=<MseLossBackward>)
output :  tensor([[101465.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5275e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139875.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5643742.5000, grad_fn=<MseLossBackward>)
output :  tensor([[231354.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(21579074., grad_fn=<MseLossBackward>)
output :  tensor([[144905.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8989.4102, grad_fn=<MseLossBackward>)
output :  tensor([[137404.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(9090.4307, grad_fn=<MseLossBackward>)
output :  tensor([[165745.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4247e+09, grad_fn=<MseLossBackward>)
output :  tensor([[268121.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(97584760., grad_fn=<MseLossBackward>)
output :  tensor([[170965.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(16273534., grad_fn=<MseLossBackward>)
output :  tensor([[104814.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4155800.7500, grad_fn=<MseLossBackward>)
output :  tensor([[202768.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5848e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161959.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8756791., grad_fn=<MseLossBackward>)
output :  tensor([[164127.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5496e+10, grad_fn=<MseLossBackward>)
output :  tensor([[100188.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3568025.7500, grad_fn=<MseLossBackward>)
output :  tensor([[122203.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1949339.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153435.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6577381.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142060.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4245209.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202269.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5150772., grad_fn=<MseLossBackward>)
output :  tensor([[135990.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(36114092., grad_fn=<MseLossBackward>)
output :  tensor([[262859.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(335421.9688, grad_fn=<MseLossBackward>)
output :  tensor([[129058.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3002e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165585.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7304.9072, grad_fn=<MseLossBackward>)
output :  tensor([[186848.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2728226.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123434.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8048e+08, grad_fn=<MseLossBackward>)
output :  tensor([[249502.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(247801.7344, grad_fn=<MseLossBackward>)
output :  tensor([[159258.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6961e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244333.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1032541.7500, grad_fn=<MseLossBackward>)
output :  tensor([[144646.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(418447.2500, grad_fn=<MseLossBackward>)
output :  tensor([[206141.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(14885370., grad_fn=<MseLossBackward>)
output :  tensor([[174552.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4633054.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152207.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3212608.2500, grad_fn=<MseLossBackward>)
output :  tensor([[115427.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(6616188.5000, grad_fn=<MseLossBackward>)
output :  tensor([[236664.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5427e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237049.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8704713., grad_fn=<MseLossBackward>)
output :  tensor([[153664.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(107113.0156, grad_fn=<MseLossBackward>)
output :  tensor([[256827.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3715738.2500, grad_fn=<MseLossBackward>)
output :  tensor([[125960.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3124e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179263.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(10649208., grad_fn=<MseLossBackward>)
output :  tensor([[162407.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5798313.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134967.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(15739321., grad_fn=<MseLossBackward>)
output :  tensor([[195100.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3034e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165584.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2509947., grad_fn=<MseLossBackward>)
output :  tensor([[163747.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(558639.4375, grad_fn=<MseLossBackward>)
output :  tensor([[157594.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(164214.9062, grad_fn=<MseLossBackward>)
output :  tensor([[150455.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(308528.1875, grad_fn=<MseLossBackward>)
output :  tensor([[175015.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2923e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161454.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2115615.7500, grad_fn=<MseLossBackward>)
output :  tensor([[376973.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(48952324., grad_fn=<MseLossBackward>)
output :  tensor([[126750.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(62004.8906, grad_fn=<MseLossBackward>)
output :  tensor([[131167.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0855e+09, grad_fn=<MseLossBackward>)
output :  tensor([[281427.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(45889.6719, grad_fn=<MseLossBackward>)
output :  tensor([[161226.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(597867.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129367.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(78639624., grad_fn=<MseLossBackward>)
output :  tensor([[241094.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(82716464., grad_fn=<MseLossBackward>)
output :  tensor([[178444.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4224117., grad_fn=<MseLossBackward>)
output :  tensor([[155877.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(15034158., grad_fn=<MseLossBackward>)
output :  tensor([[143646.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1832892.8750, grad_fn=<MseLossBackward>)
output :  tensor([[155500.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4598e+08, grad_fn=<MseLossBackward>)
output :  tensor([[101812.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3285949.2500, grad_fn=<MseLossBackward>)
output :  tensor([[72430.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5452e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165601.]], grad_fn=<AddmmBackward>)
loss:  tensor(361201., grad_fn=<MseLossBackward>)
output :  tensor([[190106.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4359e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157802.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(38907.5625, grad_fn=<MseLossBackward>)
output :  tensor([[157026.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(224291.0469, grad_fn=<MseLossBackward>)
output :  tensor([[137195.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(64929.4102, grad_fn=<MseLossBackward>)
output :  tensor([[202505.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(11866948., grad_fn=<MseLossBackward>)
output :  tensor([[139507.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2272509.2500, grad_fn=<MseLossBackward>)
output :  tensor([[183476.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6008e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144915.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1176580.8750, grad_fn=<MseLossBackward>)
output :  tensor([[108226.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3637e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93569.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(185707.1250, grad_fn=<MseLossBackward>)
output :  tensor([[175755.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(571110.8125, grad_fn=<MseLossBackward>)
output :  tensor([[262990.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6709557., grad_fn=<MseLossBackward>)
output :  tensor([[140531.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(937447.5625, grad_fn=<MseLossBackward>)
output :  tensor([[160057.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(26299.7168, grad_fn=<MseLossBackward>)
output :  tensor([[133317.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(668178.5000, grad_fn=<MseLossBackward>)
output :  tensor([[148923.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(331884., grad_fn=<MseLossBackward>)
output :  tensor([[165940.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3840436.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128230.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(1512919.2500, grad_fn=<MseLossBackward>)
output :  tensor([[173634.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1994e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158837.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3377497.2500, grad_fn=<MseLossBackward>)
output :  tensor([[118673.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4724577.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160506.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2553e+09, grad_fn=<MseLossBackward>)
output :  tensor([[54682.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(7196686.5000, grad_fn=<MseLossBackward>)
output :  tensor([[232526.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3958e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199896.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1218505.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183681.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1738318.6250, grad_fn=<MseLossBackward>)
output :  tensor([[106651.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(424615.1250, grad_fn=<MseLossBackward>)
output :  tensor([[90119.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(9731134., grad_fn=<MseLossBackward>)
output :  tensor([[137448.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6509036., grad_fn=<MseLossBackward>)
output :  tensor([[221391.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2720e+09, grad_fn=<MseLossBackward>)
output :  tensor([[203846.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(13349661., grad_fn=<MseLossBackward>)
output :  tensor([[166817.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3301886.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175096.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0827e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190795.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(632372.8750, grad_fn=<MseLossBackward>)
output :  tensor([[91080.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(16653286., grad_fn=<MseLossBackward>)
output :  tensor([[140447.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(200116.4375, grad_fn=<MseLossBackward>)
output :  tensor([[109914.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(343386.8438, grad_fn=<MseLossBackward>)
output :  tensor([[148204.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4994e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172871.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7532e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192115.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6601e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180375.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(141105.8750, grad_fn=<MseLossBackward>)
output :  tensor([[97781.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1642202.2500, grad_fn=<MseLossBackward>)
output :  tensor([[119131.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(2663143.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161586.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0237e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197764.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4997600., grad_fn=<MseLossBackward>)
output :  tensor([[146466.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6084084.5000, grad_fn=<MseLossBackward>)
train_loss: [2.5963684e+09]
epoch_result tensor([0.])
output :  tensor([[157162.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1790035., grad_fn=<MseLossBackward>)
output :  tensor([[120966.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(1067169.7500, grad_fn=<MseLossBackward>)
output :  tensor([[193988.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(45216.0352, grad_fn=<MseLossBackward>)
output :  tensor([[178926.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3711041., grad_fn=<MseLossBackward>)
output :  tensor([[153310.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0958e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129364.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1860751.7500, grad_fn=<MseLossBackward>)
output :  tensor([[141076.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5883.3691, grad_fn=<MseLossBackward>)
output :  tensor([[117565.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(2059023.2500, grad_fn=<MseLossBackward>)
output :  tensor([[66953.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(71459024., grad_fn=<MseLossBackward>)
output :  tensor([[167015.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1030669.1250, grad_fn=<MseLossBackward>)
output :  tensor([[134946.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(25534546., grad_fn=<MseLossBackward>)
output :  tensor([[224521.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(228842.6406, grad_fn=<MseLossBackward>)
output :  tensor([[168715.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(80744.7734, grad_fn=<MseLossBackward>)
output :  tensor([[248752.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(898052.3750, grad_fn=<MseLossBackward>)
output :  tensor([[57562.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6567127., grad_fn=<MseLossBackward>)
output :  tensor([[160759.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6436e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176485.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2205410.7500, grad_fn=<MseLossBackward>)
output :  tensor([[163315.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(46454236., grad_fn=<MseLossBackward>)
output :  tensor([[275014.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(221.2656, grad_fn=<MseLossBackward>)
output :  tensor([[195618.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1908715., grad_fn=<MseLossBackward>)
output :  tensor([[137612.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5563e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195643.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3112798.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177114.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2834e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151630.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(397549.9688, grad_fn=<MseLossBackward>)
output :  tensor([[173702.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(13705382., grad_fn=<MseLossBackward>)
output :  tensor([[87520.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4494797.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168738.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1068e+09, grad_fn=<MseLossBackward>)
output :  tensor([[188027.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9166892., grad_fn=<MseLossBackward>)
output :  tensor([[206856.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3662e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110859.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(738646.2500, grad_fn=<MseLossBackward>)
output :  tensor([[171913.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(833997., grad_fn=<MseLossBackward>)
output :  tensor([[136737.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(56450.7891, grad_fn=<MseLossBackward>)
output :  tensor([[125994.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9035191., grad_fn=<MseLossBackward>)
output :  tensor([[120234.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(539490.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145768.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2765e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169550.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1155e+10, grad_fn=<MseLossBackward>)
output :  tensor([[148783.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(839915., grad_fn=<MseLossBackward>)
output :  tensor([[178945.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1112794.2500, grad_fn=<MseLossBackward>)
output :  tensor([[141449.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(202092.3906, grad_fn=<MseLossBackward>)
output :  tensor([[105944.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5422e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135019.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3969e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133499.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2251172., grad_fn=<MseLossBackward>)
output :  tensor([[135544.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(73005544., grad_fn=<MseLossBackward>)
output :  tensor([[221425.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(12778838., grad_fn=<MseLossBackward>)
output :  tensor([[129291.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(8752768., grad_fn=<MseLossBackward>)
output :  tensor([[150407.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1981320.1250, grad_fn=<MseLossBackward>)
output :  tensor([[109615.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5683530.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161499.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2249672., grad_fn=<MseLossBackward>)
output :  tensor([[144060.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5949e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190195.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3256727.7500, grad_fn=<MseLossBackward>)
output :  tensor([[133095.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1834035.3750, grad_fn=<MseLossBackward>)
output :  tensor([[111158.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(1342031.7500, grad_fn=<MseLossBackward>)
output :  tensor([[227252.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(45530656., grad_fn=<MseLossBackward>)
output :  tensor([[165754.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2786e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150101.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(79186920., grad_fn=<MseLossBackward>)
output :  tensor([[202285.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8973e+10, grad_fn=<MseLossBackward>)
output :  tensor([[249715.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0875e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141410.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4367447., grad_fn=<MseLossBackward>)
output :  tensor([[134260.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(67746.3281, grad_fn=<MseLossBackward>)
output :  tensor([[157250.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5063976.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131129.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1274746.8750, grad_fn=<MseLossBackward>)
output :  tensor([[180693.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2896e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181734.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5596403.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163452.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3813171.5000, grad_fn=<MseLossBackward>)
output :  tensor([[148632.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(31726112., grad_fn=<MseLossBackward>)
output :  tensor([[144720.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4928885.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141587.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(11647929., grad_fn=<MseLossBackward>)
output :  tensor([[173871.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3315e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195373.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6770e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138942.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5965119.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171346.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(306120.1562, grad_fn=<MseLossBackward>)
output :  tensor([[176956.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(16346733., grad_fn=<MseLossBackward>)
output :  tensor([[114731.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(72247.5625, grad_fn=<MseLossBackward>)
output :  tensor([[221190.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(36195.0625, grad_fn=<MseLossBackward>)
output :  tensor([[179773.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(13888316., grad_fn=<MseLossBackward>)
output :  tensor([[127505.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(4023942., grad_fn=<MseLossBackward>)
output :  tensor([[193680.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7947906.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174656.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(59147.7617, grad_fn=<MseLossBackward>)
output :  tensor([[212031.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0352e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209303.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2879172.7500, grad_fn=<MseLossBackward>)
output :  tensor([[166070.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2299e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192496.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4013887., grad_fn=<MseLossBackward>)
output :  tensor([[110435.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(6577582., grad_fn=<MseLossBackward>)
output :  tensor([[115342.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(8080783.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110282.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2950182., grad_fn=<MseLossBackward>)
output :  tensor([[149337.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6440333.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163019.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2265e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178723.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1630409.7500, grad_fn=<MseLossBackward>)
output :  tensor([[126680.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(672246.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142561.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5947196.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180325.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0635e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118763.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(3472253.7500, grad_fn=<MseLossBackward>)
output :  tensor([[200109.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(9671225., grad_fn=<MseLossBackward>)
output :  tensor([[147295.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5268531., grad_fn=<MseLossBackward>)
output :  tensor([[211043.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3447984.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128899.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(8405243., grad_fn=<MseLossBackward>)
output :  tensor([[245399.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(8574282., grad_fn=<MseLossBackward>)
output :  tensor([[240569.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9740e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146167.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1808e+08, grad_fn=<MseLossBackward>)
output :  tensor([[84333.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4444e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194077.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5323e+09, grad_fn=<MseLossBackward>)
output :  tensor([[84996.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(15970264., grad_fn=<MseLossBackward>)
output :  tensor([[141034.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2354786.2500, grad_fn=<MseLossBackward>)
output :  tensor([[76309.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(654784.4375, grad_fn=<MseLossBackward>)
output :  tensor([[144641.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2851771., grad_fn=<MseLossBackward>)
output :  tensor([[176650.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(423556.9062, grad_fn=<MseLossBackward>)
output :  tensor([[152722.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(603971.8125, grad_fn=<MseLossBackward>)
output :  tensor([[109512.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4460808., grad_fn=<MseLossBackward>)
output :  tensor([[204409.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2397e+10, grad_fn=<MseLossBackward>)
output :  tensor([[125688.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(7904224.5000, grad_fn=<MseLossBackward>)
output :  tensor([[271108.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(79055992., grad_fn=<MseLossBackward>)
output :  tensor([[301177.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(77834856., grad_fn=<MseLossBackward>)
output :  tensor([[108155.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(429864.6250, grad_fn=<MseLossBackward>)
output :  tensor([[168336.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(17333432., grad_fn=<MseLossBackward>)
output :  tensor([[135704.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6752e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141732.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(7464678., grad_fn=<MseLossBackward>)
output :  tensor([[130639.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(151819.8125, grad_fn=<MseLossBackward>)
output :  tensor([[126644.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2703455.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132859.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4568e+08, grad_fn=<MseLossBackward>)
output :  tensor([[228477.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7839e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191240.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2428e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144067.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(28182.0156, grad_fn=<MseLossBackward>)
output :  tensor([[132058.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(20782060., grad_fn=<MseLossBackward>)
output :  tensor([[112571.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1746816.5000, grad_fn=<MseLossBackward>)
output :  tensor([[256985.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7303e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134779.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(48668.4961, grad_fn=<MseLossBackward>)
output :  tensor([[199481.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(12379183., grad_fn=<MseLossBackward>)
output :  tensor([[112473.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(57358848., grad_fn=<MseLossBackward>)
output :  tensor([[137635.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5356548.5000, grad_fn=<MseLossBackward>)
output :  tensor([[210717.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8995e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179978.]], grad_fn=<AddmmBackward>)
loss:  tensor(6084., grad_fn=<MseLossBackward>)
output :  tensor([[187447.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5988956., grad_fn=<MseLossBackward>)
output :  tensor([[164242.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0955e+10, grad_fn=<MseLossBackward>)
output :  tensor([[302998.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0241e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196736.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1354823.2500, grad_fn=<MseLossBackward>)
output :  tensor([[260926.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0145e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221283.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9996e+09, grad_fn=<MseLossBackward>)
output :  tensor([[285359.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0011e+09, grad_fn=<MseLossBackward>)
output :  tensor([[223632.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(135205.5938, grad_fn=<MseLossBackward>)
output :  tensor([[222269.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8808e+10, grad_fn=<MseLossBackward>)
output :  tensor([[198079.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1164578.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158684.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8119e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134637.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4567036., grad_fn=<MseLossBackward>)
output :  tensor([[135305.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(37757.3477, grad_fn=<MseLossBackward>)
output :  tensor([[89938.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1126185.2500, grad_fn=<MseLossBackward>)
output :  tensor([[106283.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2945782.2500, grad_fn=<MseLossBackward>)
output :  tensor([[274785.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9283e+09, grad_fn=<MseLossBackward>)
output :  tensor([[231251.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(14048792., grad_fn=<MseLossBackward>)
output :  tensor([[146617.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2617216.2500, grad_fn=<MseLossBackward>)
output :  tensor([[135818.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2826286.2500, grad_fn=<MseLossBackward>)
output :  tensor([[175522.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3201974.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142358.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(8359597.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167438.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3234e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165841.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(708201.1250, grad_fn=<MseLossBackward>)
output :  tensor([[136226.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(597698.1250, grad_fn=<MseLossBackward>)
output :  tensor([[189841.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5349e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114600.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6760487.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177008.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(25088360., grad_fn=<MseLossBackward>)
output :  tensor([[121147.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1316003.2500, grad_fn=<MseLossBackward>)
output :  tensor([[88358.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1845012.8750, grad_fn=<MseLossBackward>)
output :  tensor([[179917.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6808.8281, grad_fn=<MseLossBackward>)
output :  tensor([[113405.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(12286175., grad_fn=<MseLossBackward>)
output :  tensor([[238601.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(158876.9844, grad_fn=<MseLossBackward>)
output :  tensor([[246369.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1875487.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127155.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(5497596., grad_fn=<MseLossBackward>)
output :  tensor([[112734.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(14253633., grad_fn=<MseLossBackward>)
output :  tensor([[289238.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1879e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171978.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(229231.4844, grad_fn=<MseLossBackward>)
output :  tensor([[121450.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(12596177., grad_fn=<MseLossBackward>)
output :  tensor([[142937.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2187e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204006.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(99870976., grad_fn=<MseLossBackward>)
output :  tensor([[142264.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1598209.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159229.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4585e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153140.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(577148.8125, grad_fn=<MseLossBackward>)
output :  tensor([[131723.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4942701.5000, grad_fn=<MseLossBackward>)
output :  tensor([[248750.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6835e+10, grad_fn=<MseLossBackward>)
output :  tensor([[396926.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(25743890., grad_fn=<MseLossBackward>)
output :  tensor([[110682.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(2829623.2500, grad_fn=<MseLossBackward>)
output :  tensor([[111422.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(50092664., grad_fn=<MseLossBackward>)
output :  tensor([[159904.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(163380.1719, grad_fn=<MseLossBackward>)
output :  tensor([[131683.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9802e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163244.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4522e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175074.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2347e+09, grad_fn=<MseLossBackward>)
output :  tensor([[104523.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(853415.1250, grad_fn=<MseLossBackward>)
output :  tensor([[139450.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2400272.5000, grad_fn=<MseLossBackward>)
output :  tensor([[364524.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7667534., grad_fn=<MseLossBackward>)
output :  tensor([[206503.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2559e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178625.]], grad_fn=<AddmmBackward>)
loss:  tensor(9765625., grad_fn=<MseLossBackward>)
output :  tensor([[197294.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(31418302., grad_fn=<MseLossBackward>)
output :  tensor([[139371.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(137907.7812, grad_fn=<MseLossBackward>)
output :  tensor([[196937.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5941558.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136128.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1958e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177903.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(9589473., grad_fn=<MseLossBackward>)
output :  tensor([[237993.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(16051416., grad_fn=<MseLossBackward>)
output :  tensor([[174607.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(368999.3125, grad_fn=<MseLossBackward>)
output :  tensor([[107927.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5283.4727, grad_fn=<MseLossBackward>)
output :  tensor([[265172.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(373511.9688, grad_fn=<MseLossBackward>)
output :  tensor([[252763.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7637709.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127450.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(19804726., grad_fn=<MseLossBackward>)
output :  tensor([[216708.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3979e+09, grad_fn=<MseLossBackward>)
output :  tensor([[305418.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9528e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209173.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4725936.5000, grad_fn=<MseLossBackward>)
output :  tensor([[214484.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5754e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161947.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(16385419., grad_fn=<MseLossBackward>)
output :  tensor([[167002.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(8927117., grad_fn=<MseLossBackward>)
output :  tensor([[158011.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1165590.1250, grad_fn=<MseLossBackward>)
output :  tensor([[169327.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(451731., grad_fn=<MseLossBackward>)
output :  tensor([[241592.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9737e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224151.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(28136394., grad_fn=<MseLossBackward>)
output :  tensor([[160256.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7573e+08, grad_fn=<MseLossBackward>)
output :  tensor([[121500.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2249343.7500, grad_fn=<MseLossBackward>)
output :  tensor([[177808.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(653192.3125, grad_fn=<MseLossBackward>)
output :  tensor([[180651.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2962e+09, grad_fn=<MseLossBackward>)
output :  tensor([[209017.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4447e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132118.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(5353800.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150315.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2460e+08, grad_fn=<MseLossBackward>)
output :  tensor([[276501.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(248408.7969, grad_fn=<MseLossBackward>)
output :  tensor([[90177.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(26801814., grad_fn=<MseLossBackward>)
output :  tensor([[239000.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6253750.5000, grad_fn=<MseLossBackward>)
output :  tensor([[256487.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0657e+11, grad_fn=<MseLossBackward>)
output :  tensor([[172774.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7698630.5000, grad_fn=<MseLossBackward>)
output :  tensor([[195550.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5563e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156748.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3058290.5000, grad_fn=<MseLossBackward>)
output :  tensor([[205752.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1278e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127845.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(1332094.6250, grad_fn=<MseLossBackward>)
output :  tensor([[144697.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(91458.9922, grad_fn=<MseLossBackward>)
output :  tensor([[169476.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2775e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187103.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1570713.8750, grad_fn=<MseLossBackward>)
output :  tensor([[125907.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(8566.3701, grad_fn=<MseLossBackward>)
output :  tensor([[137143.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(414534.7812, grad_fn=<MseLossBackward>)
output :  tensor([[177677.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(21877984., grad_fn=<MseLossBackward>)
output :  tensor([[196842.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8257e+09, grad_fn=<MseLossBackward>)
output :  tensor([[241307.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2863234.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153820.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1390851.6250, grad_fn=<MseLossBackward>)
output :  tensor([[198104.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4430367., grad_fn=<MseLossBackward>)
output :  tensor([[161921.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2120e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180149.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(421627., grad_fn=<MseLossBackward>)
output :  tensor([[181341.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2078868.3750, grad_fn=<MseLossBackward>)
output :  tensor([[100001.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(9011723., grad_fn=<MseLossBackward>)
output :  tensor([[171754.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1717e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134319.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(463697.1562, grad_fn=<MseLossBackward>)
output :  tensor([[120599.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(31356850., grad_fn=<MseLossBackward>)
output :  tensor([[171440.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6549760.5000, grad_fn=<MseLossBackward>)
output :  tensor([[83625.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(1890345.7500, grad_fn=<MseLossBackward>)
output :  tensor([[286213.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(14340422., grad_fn=<MseLossBackward>)
output :  tensor([[168851.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(14833450., grad_fn=<MseLossBackward>)
output :  tensor([[194984.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9095e+10, grad_fn=<MseLossBackward>)
output :  tensor([[248647.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9961e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150104.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(802452.0625, grad_fn=<MseLossBackward>)
output :  tensor([[125037.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(1076746.7500, grad_fn=<MseLossBackward>)
output :  tensor([[123324.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(11725060., grad_fn=<MseLossBackward>)
output :  tensor([[144731.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8399e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173074.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(856058.6250, grad_fn=<MseLossBackward>)
output :  tensor([[112827.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1975e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209522.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1767e+10, grad_fn=<MseLossBackward>)
output :  tensor([[241031.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(219902.3750, grad_fn=<MseLossBackward>)
output :  tensor([[253418.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0100e+10, grad_fn=<MseLossBackward>)
output :  tensor([[220597.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3864e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198018.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3802e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189078.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2492846.2500, grad_fn=<MseLossBackward>)
output :  tensor([[207643.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7187e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191206.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0965e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177299.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2075085.2500, grad_fn=<MseLossBackward>)
output :  tensor([[151673.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(106469.6484, grad_fn=<MseLossBackward>)
output :  tensor([[329703.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(53245752., grad_fn=<MseLossBackward>)
output :  tensor([[209359.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6971167.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158084.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3668960.7500, grad_fn=<MseLossBackward>)
output :  tensor([[188316.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8285e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106422.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(2023217.3750, grad_fn=<MseLossBackward>)
output :  tensor([[275653.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8035e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171280.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6863990.5000, grad_fn=<MseLossBackward>)
output :  tensor([[217840.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(18836820., grad_fn=<MseLossBackward>)
output :  tensor([[210947.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0105e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177346.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3434304., grad_fn=<MseLossBackward>)
output :  tensor([[201140.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(435084.5312, grad_fn=<MseLossBackward>)
output :  tensor([[155978.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(958196.2500, grad_fn=<MseLossBackward>)
output :  tensor([[148776.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3792e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119261.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(579192.3750, grad_fn=<MseLossBackward>)
output :  tensor([[140180.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(32744.0332, grad_fn=<MseLossBackward>)
output :  tensor([[148673.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(106734.9297, grad_fn=<MseLossBackward>)
output :  tensor([[200492.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6258e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161565.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4265580.5000, grad_fn=<MseLossBackward>)
output :  tensor([[100547.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(1096683.5000, grad_fn=<MseLossBackward>)
output :  tensor([[226316.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8724e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185624.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0500e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175427.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1117975.7500, grad_fn=<MseLossBackward>)
output :  tensor([[84743.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7527564., grad_fn=<MseLossBackward>)
output :  tensor([[128581.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(6574.9292, grad_fn=<MseLossBackward>)
output :  tensor([[212458.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2377185.7500, grad_fn=<MseLossBackward>)
output :  tensor([[143528.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(222209.1250, grad_fn=<MseLossBackward>)
output :  tensor([[130532.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(283140.3750, grad_fn=<MseLossBackward>)
output :  tensor([[143593.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(986918.0625, grad_fn=<MseLossBackward>)
output :  tensor([[176160.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4946e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145141.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1302950.8750, grad_fn=<MseLossBackward>)
output :  tensor([[162382.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5675115., grad_fn=<MseLossBackward>)
output :  tensor([[214506.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(243912.5156, grad_fn=<MseLossBackward>)
output :  tensor([[136136.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6947e+08, grad_fn=<MseLossBackward>)
output :  tensor([[259882.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(23839570., grad_fn=<MseLossBackward>)
output :  tensor([[156780.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7395255.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130481.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3928138.2500, grad_fn=<MseLossBackward>)
output :  tensor([[95571.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(326942.7188, grad_fn=<MseLossBackward>)
output :  tensor([[154779.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9392e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180556.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(431423.1875, grad_fn=<MseLossBackward>)
output :  tensor([[119976.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(273872.3125, grad_fn=<MseLossBackward>)
output :  tensor([[187580.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7115e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144812.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2658e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149046.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(728995.8125, grad_fn=<MseLossBackward>)
output :  tensor([[186972.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(604579.1250, grad_fn=<MseLossBackward>)
output :  tensor([[253147.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5944e+09, grad_fn=<MseLossBackward>)
output :  tensor([[91534.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1159.1897, grad_fn=<MseLossBackward>)
output :  tensor([[239298.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(491663.9062, grad_fn=<MseLossBackward>)
output :  tensor([[126869.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(2659371., grad_fn=<MseLossBackward>)
output :  tensor([[167020.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7772e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114088.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9848e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175660.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(114952.7812, grad_fn=<MseLossBackward>)
output :  tensor([[165178.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6453e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154405.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7147e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237021.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3915575.2500, grad_fn=<MseLossBackward>)
output :  tensor([[224533.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1200e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128159.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1345491.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128987.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(8924689., grad_fn=<MseLossBackward>)
output :  tensor([[224259.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(7508970., grad_fn=<MseLossBackward>)
output :  tensor([[232744.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1575731., grad_fn=<MseLossBackward>)
output :  tensor([[227484.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(615857.0625, grad_fn=<MseLossBackward>)
output :  tensor([[147318.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(463803.5625, grad_fn=<MseLossBackward>)
output :  tensor([[212434.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5927246.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130846.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1765e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135030.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6404774.5000, grad_fn=<MseLossBackward>)
output :  tensor([[309691.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(28180172., grad_fn=<MseLossBackward>)
output :  tensor([[141941.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(887246.2500, grad_fn=<MseLossBackward>)
output :  tensor([[121568.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9777e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108820.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(462187.5312, grad_fn=<MseLossBackward>)
output :  tensor([[158435.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9781e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180449.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8878e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174620.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2624602.5000, grad_fn=<MseLossBackward>)
output :  tensor([[190973.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0052e+08, grad_fn=<MseLossBackward>)
output :  tensor([[102228.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(4966734.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178195.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(646742.6875, grad_fn=<MseLossBackward>)
output :  tensor([[166284.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2609789.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142877.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(15031856., grad_fn=<MseLossBackward>)
output :  tensor([[263110.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2140e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143006.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3648e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174214.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1475579.6250, grad_fn=<MseLossBackward>)
output :  tensor([[139390.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(371985.6250, grad_fn=<MseLossBackward>)
output :  tensor([[200935.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(189918.9219, grad_fn=<MseLossBackward>)
output :  tensor([[166427.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(12760970., grad_fn=<MseLossBackward>)
output :  tensor([[245030.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1061769.2500, grad_fn=<MseLossBackward>)
output :  tensor([[133369.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1277818.2500, grad_fn=<MseLossBackward>)
output :  tensor([[151775.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5881686., grad_fn=<MseLossBackward>)
output :  tensor([[214760.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(57562.5078, grad_fn=<MseLossBackward>)
output :  tensor([[163049.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3803109.5000, grad_fn=<MseLossBackward>)
output :  tensor([[197701.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(75708488., grad_fn=<MseLossBackward>)
output :  tensor([[130032.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3910e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129480.]], grad_fn=<AddmmBackward>)
loss:  tensor(230400., grad_fn=<MseLossBackward>)
output :  tensor([[139483.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(266272.1250, grad_fn=<MseLossBackward>)
output :  tensor([[202257.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5216e+09, grad_fn=<MseLossBackward>)
output :  tensor([[168092.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8188e+09, grad_fn=<MseLossBackward>)
output :  tensor([[75977.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5527e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94260.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(95264768., grad_fn=<MseLossBackward>)
output :  tensor([[248660.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(21461504., grad_fn=<MseLossBackward>)
output :  tensor([[204178.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2483e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115991.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(983552.5625, grad_fn=<MseLossBackward>)
output :  tensor([[159372.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9117e+08, grad_fn=<MseLossBackward>)
output :  tensor([[211800.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(67224880., grad_fn=<MseLossBackward>)
output :  tensor([[181078.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9071e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157451.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6011767.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168030.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3877945.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117371.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5625939.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161475.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(41926232., grad_fn=<MseLossBackward>)
output :  tensor([[192896.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9610e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221023.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2321766.5000, grad_fn=<MseLossBackward>)
output :  tensor([[247172.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4783e+11, grad_fn=<MseLossBackward>)
output :  tensor([[149858.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(8168432., grad_fn=<MseLossBackward>)
output :  tensor([[110636.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(4652143.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170371.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3290e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146005.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(20201092., grad_fn=<MseLossBackward>)
output :  tensor([[232646.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(18953642., grad_fn=<MseLossBackward>)
output :  tensor([[115142.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(20384.2539, grad_fn=<MseLossBackward>)
output :  tensor([[184413.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2291439., grad_fn=<MseLossBackward>)
output :  tensor([[186178.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(272157.8438, grad_fn=<MseLossBackward>)
output :  tensor([[164703.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4117e+10, grad_fn=<MseLossBackward>)
output :  tensor([[94770.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8963e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236389.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6813731.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178474.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6123459.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140317.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(100667.3906, grad_fn=<MseLossBackward>)
output :  tensor([[237328.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5420675.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164433.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2054295.1250, grad_fn=<MseLossBackward>)
output :  tensor([[203986.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4644e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136153.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1329877.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186846.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1733e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134893.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1224169.3750, grad_fn=<MseLossBackward>)
output :  tensor([[226338.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(93351832., grad_fn=<MseLossBackward>)
output :  tensor([[225997.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7611e+08, grad_fn=<MseLossBackward>)
output :  tensor([[89899.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(10152.1367, grad_fn=<MseLossBackward>)
output :  tensor([[163886.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(19824896., grad_fn=<MseLossBackward>)
output :  tensor([[245471.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5727e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147158.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4657773.5000, grad_fn=<MseLossBackward>)
output :  tensor([[108030.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6835e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164949.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(201825.5625, grad_fn=<MseLossBackward>)
output :  tensor([[148224.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(17847588., grad_fn=<MseLossBackward>)
output :  tensor([[130540.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5480061.5000, grad_fn=<MseLossBackward>)
output :  tensor([[189781.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7912e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124402.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(3620309., grad_fn=<MseLossBackward>)
output :  tensor([[152140.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(19784.1797, grad_fn=<MseLossBackward>)
output :  tensor([[168792.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8749579., grad_fn=<MseLossBackward>)
output :  tensor([[147746.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(10582822., grad_fn=<MseLossBackward>)
output :  tensor([[159046.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(14847295., grad_fn=<MseLossBackward>)
output :  tensor([[135684.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1208e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132474.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(225239.2344, grad_fn=<MseLossBackward>)
output :  tensor([[153047.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9733e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145828.]], grad_fn=<AddmmBackward>)
loss:  tensor(2808976., grad_fn=<MseLossBackward>)
output :  tensor([[156901.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(23505680., grad_fn=<MseLossBackward>)
output :  tensor([[135055.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3281e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150082.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1644285.2500, grad_fn=<MseLossBackward>)
output :  tensor([[183331.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(21792120., grad_fn=<MseLossBackward>)
output :  tensor([[172627.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(13161250., grad_fn=<MseLossBackward>)
output :  tensor([[179849.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(22607.9414, grad_fn=<MseLossBackward>)
output :  tensor([[221284.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1649017.1250, grad_fn=<MseLossBackward>)
output :  tensor([[110753.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(8140902., grad_fn=<MseLossBackward>)
output :  tensor([[137836.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6735e+08, grad_fn=<MseLossBackward>)
output :  tensor([[284390.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2589082.2500, grad_fn=<MseLossBackward>)
output :  tensor([[117856.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(3445403., grad_fn=<MseLossBackward>)
output :  tensor([[177244.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8280e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184045.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(910354.5000, grad_fn=<MseLossBackward>)
output :  tensor([[185916.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(173797.7969, grad_fn=<MseLossBackward>)
output :  tensor([[250935.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7911e+08, grad_fn=<MseLossBackward>)
output :  tensor([[218226.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(14237769., grad_fn=<MseLossBackward>)
output :  tensor([[127317.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5869e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174825.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7634e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126884.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(8323044.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182681.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5586e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153242.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(58654.7852, grad_fn=<MseLossBackward>)
output :  tensor([[155535.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(81645904., grad_fn=<MseLossBackward>)
output :  tensor([[202177.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(16993976., grad_fn=<MseLossBackward>)
output :  tensor([[144849.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5252e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173856.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4596066., grad_fn=<MseLossBackward>)
output :  tensor([[252148.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4809e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149006.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1013923.1250, grad_fn=<MseLossBackward>)
output :  tensor([[201517.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1317150.7500, grad_fn=<MseLossBackward>)
output :  tensor([[167432.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(55984064., grad_fn=<MseLossBackward>)
output :  tensor([[121005.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0894e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136198.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(200942.0781, grad_fn=<MseLossBackward>)
output :  tensor([[183122.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(770417.6250, grad_fn=<MseLossBackward>)
output :  tensor([[197964.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(63435748., grad_fn=<MseLossBackward>)
output :  tensor([[235436.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8691e+09, grad_fn=<MseLossBackward>)
output :  tensor([[257369.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(136484.0625, grad_fn=<MseLossBackward>)
output :  tensor([[186308.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7607e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143942.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7502e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143216.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1648455.3750, grad_fn=<MseLossBackward>)
output :  tensor([[69937.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9627e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138540.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(12533591., grad_fn=<MseLossBackward>)
output :  tensor([[131263.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5587388., grad_fn=<MseLossBackward>)
output :  tensor([[158336.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(18801302., grad_fn=<MseLossBackward>)
output :  tensor([[126309.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(476326.4375, grad_fn=<MseLossBackward>)
output :  tensor([[77154.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(428390.7188, grad_fn=<MseLossBackward>)
output :  tensor([[82742.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(551584.7500, grad_fn=<MseLossBackward>)
output :  tensor([[228319.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(13545965., grad_fn=<MseLossBackward>)
output :  tensor([[141977.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6891e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134730.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(17900964., grad_fn=<MseLossBackward>)
output :  tensor([[167060.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3662.1409, grad_fn=<MseLossBackward>)
output :  tensor([[232213.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(7765366., grad_fn=<MseLossBackward>)
output :  tensor([[191288.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(725664.3750, grad_fn=<MseLossBackward>)
output :  tensor([[153817.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4764534., grad_fn=<MseLossBackward>)
output :  tensor([[196992.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(823981.6875, grad_fn=<MseLossBackward>)
output :  tensor([[205589.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8659e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138217.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1481469.3750, grad_fn=<MseLossBackward>)
output :  tensor([[155236.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(55718.1289, grad_fn=<MseLossBackward>)
output :  tensor([[136943.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(889985.8750, grad_fn=<MseLossBackward>)
output :  tensor([[200319.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8094e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156094.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4387715.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136273.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8296e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147028.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4530978., grad_fn=<MseLossBackward>)
output :  tensor([[206691.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(28184486., grad_fn=<MseLossBackward>)
output :  tensor([[97664.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4537e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165707.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3212104., grad_fn=<MseLossBackward>)
output :  tensor([[131424.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(11730411., grad_fn=<MseLossBackward>)
output :  tensor([[144689.]], grad_fn=<AddmmBackward>)
loss:  tensor(5340721., grad_fn=<MseLossBackward>)
output :  tensor([[102554.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6137e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138461.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(923821.3125, grad_fn=<MseLossBackward>)
output :  tensor([[234347.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2730498., grad_fn=<MseLossBackward>)
output :  tensor([[145483.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(233832.6875, grad_fn=<MseLossBackward>)
output :  tensor([[138118.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(382890.2500, grad_fn=<MseLossBackward>)
output :  tensor([[164895.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3613e+09, grad_fn=<MseLossBackward>)
output :  tensor([[270355.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(58439336., grad_fn=<MseLossBackward>)
output :  tensor([[176430.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2046330.2500, grad_fn=<MseLossBackward>)
output :  tensor([[102991.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(46399.8516, grad_fn=<MseLossBackward>)
output :  tensor([[202527.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6208e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159834.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(697042.3750, grad_fn=<MseLossBackward>)
output :  tensor([[163152.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5913e+10, grad_fn=<MseLossBackward>)
output :  tensor([[100741.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5960541., grad_fn=<MseLossBackward>)
output :  tensor([[122081.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2304419., grad_fn=<MseLossBackward>)
output :  tensor([[154536.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2142426.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142232.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4985591., grad_fn=<MseLossBackward>)
output :  tensor([[199501.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(248128.5156, grad_fn=<MseLossBackward>)
output :  tensor([[143923.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3700393.2500, grad_fn=<MseLossBackward>)
output :  tensor([[260781.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2244519., grad_fn=<MseLossBackward>)
output :  tensor([[124823.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0127e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162545.]], grad_fn=<AddmmBackward>)
loss:  tensor(8732025., grad_fn=<MseLossBackward>)
output :  tensor([[185835.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7097645.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124282.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0399e+08, grad_fn=<MseLossBackward>)
output :  tensor([[254593.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(21098664., grad_fn=<MseLossBackward>)
output :  tensor([[158549.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0945e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243128.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4936728.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141304.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7264793.5000, grad_fn=<MseLossBackward>)
output :  tensor([[208802.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1434492.7500, grad_fn=<MseLossBackward>)
output :  tensor([[177498.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(25994862., grad_fn=<MseLossBackward>)
output :  tensor([[153316.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(466574.3750, grad_fn=<MseLossBackward>)
output :  tensor([[121900.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(15216399., grad_fn=<MseLossBackward>)
output :  tensor([[239160.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2972e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238194.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3261241., grad_fn=<MseLossBackward>)
output :  tensor([[148242.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(25954886., grad_fn=<MseLossBackward>)
output :  tensor([[253760.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1298282.2500, grad_fn=<MseLossBackward>)
output :  tensor([[123134.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(74484992., grad_fn=<MseLossBackward>)
output :  tensor([[176238.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(56740.7305, grad_fn=<MseLossBackward>)
output :  tensor([[160018.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(338.2151, grad_fn=<MseLossBackward>)
output :  tensor([[130676.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(104419.8672, grad_fn=<MseLossBackward>)
output :  tensor([[191887.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8922e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167656.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(13372735., grad_fn=<MseLossBackward>)
output :  tensor([[164173.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1376735.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157635.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(133076.7656, grad_fn=<MseLossBackward>)
output :  tensor([[144267.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(31721712., grad_fn=<MseLossBackward>)
output :  tensor([[170721.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7481e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158392.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2584960.5000, grad_fn=<MseLossBackward>)
output :  tensor([[378845.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(26257938., grad_fn=<MseLossBackward>)
output :  tensor([[138388.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2969e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130958.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0665e+09, grad_fn=<MseLossBackward>)
output :  tensor([[275372.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(34116552., grad_fn=<MseLossBackward>)
output :  tensor([[163460.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2133197.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132105.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3469e+08, grad_fn=<MseLossBackward>)
output :  tensor([[230370.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2655575.7500, grad_fn=<MseLossBackward>)
output :  tensor([[179333.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1359628.8750, grad_fn=<MseLossBackward>)
output :  tensor([[155484.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(12138909., grad_fn=<MseLossBackward>)
output :  tensor([[144808.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(36678.2344, grad_fn=<MseLossBackward>)
output :  tensor([[153334.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7010e+08, grad_fn=<MseLossBackward>)
output :  tensor([[99503.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(246380.3906, grad_fn=<MseLossBackward>)
output :  tensor([[76965.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8781e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164400.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(359306.5938, grad_fn=<MseLossBackward>)
output :  tensor([[189655.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4703e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163388.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(29035932., grad_fn=<MseLossBackward>)
output :  tensor([[169831.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5207e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137592.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(20270.6406, grad_fn=<MseLossBackward>)
output :  tensor([[208383.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(5920325.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140633.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6932853.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183769.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5934e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150646.]], grad_fn=<AddmmBackward>)
loss:  tensor(21585316., grad_fn=<MseLossBackward>)
output :  tensor([[109175.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8518e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96275.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5179536., grad_fn=<MseLossBackward>)
output :  tensor([[174129.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(756954.3750, grad_fn=<MseLossBackward>)
output :  tensor([[257289.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(9674141., grad_fn=<MseLossBackward>)
output :  tensor([[141685.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(34445.0391, grad_fn=<MseLossBackward>)
output :  tensor([[158581.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1726390.7500, grad_fn=<MseLossBackward>)
output :  tensor([[133978.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2187348.5000, grad_fn=<MseLossBackward>)
output :  tensor([[149122.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(142706.8750, grad_fn=<MseLossBackward>)
output :  tensor([[169717.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3303817.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124301.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(7281270., grad_fn=<MseLossBackward>)
output :  tensor([[171171.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8497e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157425.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(180664.8438, grad_fn=<MseLossBackward>)
output :  tensor([[116588.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7859.9307, grad_fn=<MseLossBackward>)
output :  tensor([[159657.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3791e+09, grad_fn=<MseLossBackward>)
output :  tensor([[52975.5898]], grad_fn=<AddmmBackward>)
loss:  tensor(951775.5625, grad_fn=<MseLossBackward>)
output :  tensor([[231094.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6268e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200312.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(472634.7812, grad_fn=<MseLossBackward>)
output :  tensor([[184773.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(51351.8086, grad_fn=<MseLossBackward>)
output :  tensor([[106411.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(169293.6719, grad_fn=<MseLossBackward>)
output :  tensor([[85736.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1595287.3750, grad_fn=<MseLossBackward>)
output :  tensor([[145360.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(28733118., grad_fn=<MseLossBackward>)
output :  tensor([[223400.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9842e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205483.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4066020.2500, grad_fn=<MseLossBackward>)
output :  tensor([[166322.]], grad_fn=<AddmmBackward>)
loss:  tensor(1747684., grad_fn=<MseLossBackward>)
output :  tensor([[175254.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0542e+09, grad_fn=<MseLossBackward>)
output :  tensor([[187900.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4407703.5000, grad_fn=<MseLossBackward>)
output :  tensor([[88672.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2796106.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139470.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(280436.4375, grad_fn=<MseLossBackward>)
output :  tensor([[112822.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(5392228., grad_fn=<MseLossBackward>)
output :  tensor([[147025.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2244e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173156.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7772e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192953.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4512e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179631.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(135942., grad_fn=<MseLossBackward>)
output :  tensor([[99304.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7864081., grad_fn=<MseLossBackward>)
output :  tensor([[117162.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(114090.8984, grad_fn=<MseLossBackward>)
output :  tensor([[162642.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5613e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197664.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5455290., grad_fn=<MseLossBackward>)
output :  tensor([[147200.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(10243500., grad_fn=<MseLossBackward>)
train_loss: [2.573742e+09]
epoch_result tensor([0.])
output :  tensor([[159546.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1094933.3750, grad_fn=<MseLossBackward>)
output :  tensor([[126347.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(18903882., grad_fn=<MseLossBackward>)
output :  tensor([[196676.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6127558.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176273.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(527870.3750, grad_fn=<MseLossBackward>)
output :  tensor([[154540.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5037e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128889.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(790654.4375, grad_fn=<MseLossBackward>)
output :  tensor([[141353.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(124851.8047, grad_fn=<MseLossBackward>)
output :  tensor([[118790.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(43828.0781, grad_fn=<MseLossBackward>)
output :  tensor([[67279.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(77081400., grad_fn=<MseLossBackward>)
output :  tensor([[166663.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(440335.9375, grad_fn=<MseLossBackward>)
output :  tensor([[143718.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(13827707., grad_fn=<MseLossBackward>)
output :  tensor([[225732.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(536167.1875, grad_fn=<MseLossBackward>)
output :  tensor([[168682.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(100806.2500, grad_fn=<MseLossBackward>)
output :  tensor([[248912.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(620328.5000, grad_fn=<MseLossBackward>)
output :  tensor([[58241.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(10509247., grad_fn=<MseLossBackward>)
output :  tensor([[161493.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8877e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166626.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(70122048., grad_fn=<MseLossBackward>)
output :  tensor([[154788.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2930462.5000, grad_fn=<MseLossBackward>)
output :  tensor([[276661.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2761620.7500, grad_fn=<MseLossBackward>)
output :  tensor([[194345.]], grad_fn=<AddmmBackward>)
loss:  tensor(7049025., grad_fn=<MseLossBackward>)
output :  tensor([[139419.]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4573e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195328.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2101820.2500, grad_fn=<MseLossBackward>)
output :  tensor([[181011.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9262e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150862.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(18906.2500, grad_fn=<MseLossBackward>)
output :  tensor([[164275.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(32772226., grad_fn=<MseLossBackward>)
output :  tensor([[84857.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(293958.8125, grad_fn=<MseLossBackward>)
output :  tensor([[170729.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3327e+09, grad_fn=<MseLossBackward>)
output :  tensor([[187048.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4195904., grad_fn=<MseLossBackward>)
output :  tensor([[209913.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0782e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109691.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(95321.7422, grad_fn=<MseLossBackward>)
output :  tensor([[169804.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1430341.2500, grad_fn=<MseLossBackward>)
output :  tensor([[135397.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1216505.6250, grad_fn=<MseLossBackward>)
output :  tensor([[128728.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(73508.7656, grad_fn=<MseLossBackward>)
output :  tensor([[122438.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(8635471., grad_fn=<MseLossBackward>)
output :  tensor([[144931.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8018e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166941.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1921e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147385.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5354740.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183120.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9738690., grad_fn=<MseLossBackward>)
output :  tensor([[141661.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(437003.6250, grad_fn=<MseLossBackward>)
output :  tensor([[107641.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1123e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137708.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9740e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137672.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7144845.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136007.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(81143784., grad_fn=<MseLossBackward>)
output :  tensor([[221536.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(11997456., grad_fn=<MseLossBackward>)
output :  tensor([[134491.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5025863.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151810.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7896627., grad_fn=<MseLossBackward>)
output :  tensor([[118382.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(40732316., grad_fn=<MseLossBackward>)
output :  tensor([[160896.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(804468.8750, grad_fn=<MseLossBackward>)
output :  tensor([[146428.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3592e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191518.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(231631.6406, grad_fn=<MseLossBackward>)
output :  tensor([[134058.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(153211.0781, grad_fn=<MseLossBackward>)
output :  tensor([[101810.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(67069444., grad_fn=<MseLossBackward>)
output :  tensor([[231498.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6255939., grad_fn=<MseLossBackward>)
output :  tensor([[167991.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0701e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156844.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4644900.5000, grad_fn=<MseLossBackward>)
output :  tensor([[205144.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8008e+10, grad_fn=<MseLossBackward>)
output :  tensor([[247479.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1347e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142669.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(689107.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128862.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(26397680., grad_fn=<MseLossBackward>)
output :  tensor([[155609.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(371795.0625, grad_fn=<MseLossBackward>)
output :  tensor([[133846.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(14795081., grad_fn=<MseLossBackward>)
output :  tensor([[182264.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0428e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184537.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(191474.6094, grad_fn=<MseLossBackward>)
output :  tensor([[160209.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1664503.1250, grad_fn=<MseLossBackward>)
output :  tensor([[135130.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(61933212., grad_fn=<MseLossBackward>)
output :  tensor([[143696.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1430453.3750, grad_fn=<MseLossBackward>)
output :  tensor([[148938.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(15509198., grad_fn=<MseLossBackward>)
output :  tensor([[173844.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3351e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195245.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7325e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137525.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1052547.7500, grad_fn=<MseLossBackward>)
output :  tensor([[177557.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(32012788., grad_fn=<MseLossBackward>)
output :  tensor([[178021.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(8874069., grad_fn=<MseLossBackward>)
output :  tensor([[116052.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1107098.5000, grad_fn=<MseLossBackward>)
output :  tensor([[217154.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(14786188., grad_fn=<MseLossBackward>)
output :  tensor([[184739.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1536437.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128172.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(7143467.5000, grad_fn=<MseLossBackward>)
output :  tensor([[199828.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(11080369., grad_fn=<MseLossBackward>)
output :  tensor([[176598.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2885220.7500, grad_fn=<MseLossBackward>)
output :  tensor([[213763.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9752e+10, grad_fn=<MseLossBackward>)
output :  tensor([[210002.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(995380.3750, grad_fn=<MseLossBackward>)
output :  tensor([[167547.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3357e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195318.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(670556.2500, grad_fn=<MseLossBackward>)
output :  tensor([[110266.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7470741., grad_fn=<MseLossBackward>)
output :  tensor([[115947.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(11886711., grad_fn=<MseLossBackward>)
output :  tensor([[112581.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(338587.5938, grad_fn=<MseLossBackward>)
output :  tensor([[146993.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(37412.0234, grad_fn=<MseLossBackward>)
output :  tensor([[160809.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3063e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177772.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4963079., grad_fn=<MseLossBackward>)
output :  tensor([[128230.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(534132.5625, grad_fn=<MseLossBackward>)
output :  tensor([[145242.]], grad_fn=<AddmmBackward>)
loss:  tensor(58564., grad_fn=<MseLossBackward>)
output :  tensor([[182667.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2817e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119643.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(7528207., grad_fn=<MseLossBackward>)
output :  tensor([[195916.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1173159.7500, grad_fn=<MseLossBackward>)
output :  tensor([[144566.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(187949.3438, grad_fn=<MseLossBackward>)
output :  tensor([[212180.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(517815.1562, grad_fn=<MseLossBackward>)
output :  tensor([[128349.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5519342.5000, grad_fn=<MseLossBackward>)
output :  tensor([[243784.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(20644386., grad_fn=<MseLossBackward>)
output :  tensor([[239430.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0766e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144224.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6446e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85224.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8684e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196327.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1736e+09, grad_fn=<MseLossBackward>)
output :  tensor([[83666.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(7110847., grad_fn=<MseLossBackward>)
output :  tensor([[139529.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(879.4932, grad_fn=<MseLossBackward>)
output :  tensor([[75817.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(101029.6172, grad_fn=<MseLossBackward>)
output :  tensor([[144704.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3066384., grad_fn=<MseLossBackward>)
output :  tensor([[177401.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1964070.8750, grad_fn=<MseLossBackward>)
output :  tensor([[153440.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3555.1406, grad_fn=<MseLossBackward>)
output :  tensor([[109051.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(2727633., grad_fn=<MseLossBackward>)
output :  tensor([[204083.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2469e+10, grad_fn=<MseLossBackward>)
output :  tensor([[128977.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(228416.7812, grad_fn=<MseLossBackward>)
output :  tensor([[267664.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5217e+08, grad_fn=<MseLossBackward>)
output :  tensor([[305429.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(20890898., grad_fn=<MseLossBackward>)
output :  tensor([[105679.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(3315785., grad_fn=<MseLossBackward>)
output :  tensor([[170487.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4048584.2500, grad_fn=<MseLossBackward>)
output :  tensor([[135710.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6790e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132218.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(45990224., grad_fn=<MseLossBackward>)
output :  tensor([[131053.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(645762.9375, grad_fn=<MseLossBackward>)
output :  tensor([[126686.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(2845310., grad_fn=<MseLossBackward>)
output :  tensor([[134661.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3308e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226382.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8658e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187871.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3448e+10, grad_fn=<MseLossBackward>)
output :  tensor([[140674.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(10404556., grad_fn=<MseLossBackward>)
output :  tensor([[131664.]], grad_fn=<AddmmBackward>)
loss:  tensor(17338896., grad_fn=<MseLossBackward>)
output :  tensor([[111228.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(453.2242, grad_fn=<MseLossBackward>)
output :  tensor([[254737.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0098e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136572.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2472019.2500, grad_fn=<MseLossBackward>)
output :  tensor([[206117.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(9717637., grad_fn=<MseLossBackward>)
output :  tensor([[104850.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2470.4006, grad_fn=<MseLossBackward>)
output :  tensor([[139218.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(534406.6875, grad_fn=<MseLossBackward>)
output :  tensor([[209443.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2669e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183438.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(12519545., grad_fn=<MseLossBackward>)
output :  tensor([[187524.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6372074.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163454.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1184e+10, grad_fn=<MseLossBackward>)
output :  tensor([[301197.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1426e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201950.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(16408196., grad_fn=<MseLossBackward>)
output :  tensor([[261706.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9925e+10, grad_fn=<MseLossBackward>)
output :  tensor([[224098.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7557e+09, grad_fn=<MseLossBackward>)
output :  tensor([[288009.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4044e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223255.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(554233.7500, grad_fn=<MseLossBackward>)
output :  tensor([[222855.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8610e+10, grad_fn=<MseLossBackward>)
output :  tensor([[199004.]], grad_fn=<AddmmBackward>)
loss:  tensor(4016016., grad_fn=<MseLossBackward>)
output :  tensor([[159377.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2281e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131534.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(931405.9375, grad_fn=<MseLossBackward>)
output :  tensor([[137694.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4817956.5000, grad_fn=<MseLossBackward>)
output :  tensor([[90372.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(394217.2188, grad_fn=<MseLossBackward>)
output :  tensor([[106042.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(3832142.7500, grad_fn=<MseLossBackward>)
output :  tensor([[271358.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3110e+09, grad_fn=<MseLossBackward>)
output :  tensor([[233221.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3164340.7500, grad_fn=<MseLossBackward>)
output :  tensor([[144830.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(28571.5625, grad_fn=<MseLossBackward>)
output :  tensor([[138010.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(260323.1719, grad_fn=<MseLossBackward>)
output :  tensor([[175113.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1906470.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146618.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1873348.2500, grad_fn=<MseLossBackward>)
output :  tensor([[165643.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3268e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164334.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(443015.0312, grad_fn=<MseLossBackward>)
output :  tensor([[138924.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3702557.7500, grad_fn=<MseLossBackward>)
output :  tensor([[189014.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4242e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113038.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1079391.1250, grad_fn=<MseLossBackward>)
output :  tensor([[170562.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2067529.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120293.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(85986.3984, grad_fn=<MseLossBackward>)
output :  tensor([[87208.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(43498.3164, grad_fn=<MseLossBackward>)
output :  tensor([[180747.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(559176.8125, grad_fn=<MseLossBackward>)
output :  tensor([[112068.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(4700461., grad_fn=<MseLossBackward>)
output :  tensor([[240196.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1431986.1250, grad_fn=<MseLossBackward>)
output :  tensor([[244396.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(364740.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134182.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(21925952., grad_fn=<MseLossBackward>)
output :  tensor([[108404.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(307322.9688, grad_fn=<MseLossBackward>)
output :  tensor([[287389.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2429e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170525.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(948797.7500, grad_fn=<MseLossBackward>)
output :  tensor([[127513.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(6319057., grad_fn=<MseLossBackward>)
output :  tensor([[142632.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0677e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202389.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3480e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140604.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(156111.4219, grad_fn=<MseLossBackward>)
output :  tensor([[158713.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4710e+10, grad_fn=<MseLossBackward>)
output :  tensor([[156733.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8028102.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129916.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(173654.5156, grad_fn=<MseLossBackward>)
output :  tensor([[248586.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6878e+10, grad_fn=<MseLossBackward>)
output :  tensor([[394577.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(55089332., grad_fn=<MseLossBackward>)
output :  tensor([[110479.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(2188157.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117987.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(263128.9375, grad_fn=<MseLossBackward>)
output :  tensor([[160488.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(977842.8750, grad_fn=<MseLossBackward>)
output :  tensor([[129889.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8130e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163158.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4624e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174367.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1432e+09, grad_fn=<MseLossBackward>)
output :  tensor([[104890.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(1664321.7500, grad_fn=<MseLossBackward>)
output :  tensor([[140533.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(217374.5000, grad_fn=<MseLossBackward>)
output :  tensor([[366340.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(909043.0625, grad_fn=<MseLossBackward>)
output :  tensor([[207248.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1857e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181427.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(35140812., grad_fn=<MseLossBackward>)
output :  tensor([[203348.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(200928.0625, grad_fn=<MseLossBackward>)
output :  tensor([[138320.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(461677.7812, grad_fn=<MseLossBackward>)
output :  tensor([[195020.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(271327.0312, grad_fn=<MseLossBackward>)
output :  tensor([[134234.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1473e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178340.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(7074769., grad_fn=<MseLossBackward>)
output :  tensor([[242421.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(177583.2344, grad_fn=<MseLossBackward>)
output :  tensor([[175402.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1967751.3750, grad_fn=<MseLossBackward>)
output :  tensor([[111543.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(12559216., grad_fn=<MseLossBackward>)
output :  tensor([[263189.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1881098., grad_fn=<MseLossBackward>)
output :  tensor([[240874.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(83266768., grad_fn=<MseLossBackward>)
output :  tensor([[120017.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(8897124., grad_fn=<MseLossBackward>)
output :  tensor([[214854.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6175e+09, grad_fn=<MseLossBackward>)
output :  tensor([[306064.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6999e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207420.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(176426.2500, grad_fn=<MseLossBackward>)
output :  tensor([[214209.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5823e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158122.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(49506.2500, grad_fn=<MseLossBackward>)
output :  tensor([[172752.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7633392., grad_fn=<MseLossBackward>)
output :  tensor([[161186.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(18104094., grad_fn=<MseLossBackward>)
output :  tensor([[167350.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7018194.5000, grad_fn=<MseLossBackward>)
output :  tensor([[238884.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4773e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221239.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(67511640., grad_fn=<MseLossBackward>)
output :  tensor([[161045.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9728e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123439.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(193435.0312, grad_fn=<MseLossBackward>)
output :  tensor([[176171.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(686205.1250, grad_fn=<MseLossBackward>)
output :  tensor([[179564.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4699e+09, grad_fn=<MseLossBackward>)
output :  tensor([[208741.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4550e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133148.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1647251.8750, grad_fn=<MseLossBackward>)
output :  tensor([[149895.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0066e+08, grad_fn=<MseLossBackward>)
output :  tensor([[278613.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2603584., grad_fn=<MseLossBackward>)
output :  tensor([[86603.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(2569784.2500, grad_fn=<MseLossBackward>)
output :  tensor([[235002.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2242693.5000, grad_fn=<MseLossBackward>)
output :  tensor([[260044.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0426e+11, grad_fn=<MseLossBackward>)
output :  tensor([[169845.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(23735.2539, grad_fn=<MseLossBackward>)
output :  tensor([[196055.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5167e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155082.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6816.5664, grad_fn=<MseLossBackward>)
output :  tensor([[206491.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0333e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130090.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1189599.2500, grad_fn=<MseLossBackward>)
output :  tensor([[148958.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(15666506., grad_fn=<MseLossBackward>)
output :  tensor([[168711.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8702e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186539.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(475194.8125, grad_fn=<MseLossBackward>)
output :  tensor([[130242.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(18000794., grad_fn=<MseLossBackward>)
output :  tensor([[136811.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(97207.5469, grad_fn=<MseLossBackward>)
output :  tensor([[175220.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4931245., grad_fn=<MseLossBackward>)
output :  tensor([[196864.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8234e+09, grad_fn=<MseLossBackward>)
output :  tensor([[240997.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4009318., grad_fn=<MseLossBackward>)
output :  tensor([[154343.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(431094.8438, grad_fn=<MseLossBackward>)
output :  tensor([[195949.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2569.2227, grad_fn=<MseLossBackward>)
output :  tensor([[159997.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5591e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179668.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(28471.2891, grad_fn=<MseLossBackward>)
output :  tensor([[175760.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(17135848., grad_fn=<MseLossBackward>)
output :  tensor([[97324.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(105036.7578, grad_fn=<MseLossBackward>)
output :  tensor([[171657.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1738e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133424.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2481511., grad_fn=<MseLossBackward>)
output :  tensor([[122077.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(50093992., grad_fn=<MseLossBackward>)
output :  tensor([[174680.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(463526.9375, grad_fn=<MseLossBackward>)
output :  tensor([[85394.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(155426.9062, grad_fn=<MseLossBackward>)
output :  tensor([[282921.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(50104720., grad_fn=<MseLossBackward>)
output :  tensor([[168807.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(14496461., grad_fn=<MseLossBackward>)
output :  tensor([[192473.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9795e+10, grad_fn=<MseLossBackward>)
output :  tensor([[247415.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5621e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149265.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3008056.7500, grad_fn=<MseLossBackward>)
output :  tensor([[120358.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(13263993., grad_fn=<MseLossBackward>)
output :  tensor([[118293.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(2581520., grad_fn=<MseLossBackward>)
output :  tensor([[141817.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1919e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175389.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1931405., grad_fn=<MseLossBackward>)
output :  tensor([[111243.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2617e+08, grad_fn=<MseLossBackward>)
output :  tensor([[213875.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0842e+10, grad_fn=<MseLossBackward>)
output :  tensor([[238354.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(9895252., grad_fn=<MseLossBackward>)
output :  tensor([[254654.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9751e+10, grad_fn=<MseLossBackward>)
output :  tensor([[223217.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4909e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196087.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4259e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190106.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6791562., grad_fn=<MseLossBackward>)
output :  tensor([[210471.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5967e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189187.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1554e+10, grad_fn=<MseLossBackward>)
output :  tensor([[181148.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5801324., grad_fn=<MseLossBackward>)
output :  tensor([[153089.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1186703.8750, grad_fn=<MseLossBackward>)
output :  tensor([[333968.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(9190750., grad_fn=<MseLossBackward>)
output :  tensor([[212285.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(81287.3594, grad_fn=<MseLossBackward>)
output :  tensor([[162094.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4388305., grad_fn=<MseLossBackward>)
output :  tensor([[186113.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0677e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103442.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(2426463.2500, grad_fn=<MseLossBackward>)
output :  tensor([[273325.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9341e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171595.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5311224.5000, grad_fn=<MseLossBackward>)
output :  tensor([[215720.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4931453., grad_fn=<MseLossBackward>)
output :  tensor([[210693.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0623e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176892.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5323474.5000, grad_fn=<MseLossBackward>)
output :  tensor([[203982.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4761669.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155536.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(287647.8438, grad_fn=<MseLossBackward>)
output :  tensor([[147435.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2501e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117166.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(1777868., grad_fn=<MseLossBackward>)
output :  tensor([[139409.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(348136.8750, grad_fn=<MseLossBackward>)
output :  tensor([[148951.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2362.8713, grad_fn=<MseLossBackward>)
output :  tensor([[202817.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5671e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160315.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(665244.1250, grad_fn=<MseLossBackward>)
output :  tensor([[100268.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(590976.5625, grad_fn=<MseLossBackward>)
output :  tensor([[229303.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1442e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185794.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1185e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176213.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(73933.0078, grad_fn=<MseLossBackward>)
output :  tensor([[84621.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(6870992.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127514.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(971395.0625, grad_fn=<MseLossBackward>)
output :  tensor([[218287.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(18384666., grad_fn=<MseLossBackward>)
output :  tensor([[143333.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(444138.9375, grad_fn=<MseLossBackward>)
output :  tensor([[129490.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(259208.2656, grad_fn=<MseLossBackward>)
output :  tensor([[143422.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(676352.0625, grad_fn=<MseLossBackward>)
output :  tensor([[178078.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6466e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144443.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(196692.2500, grad_fn=<MseLossBackward>)
output :  tensor([[159770.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(52476.7891, grad_fn=<MseLossBackward>)
output :  tensor([[216839.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3385082.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138372.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1137e+09, grad_fn=<MseLossBackward>)
output :  tensor([[257625.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6891445.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161146.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2711476.7500, grad_fn=<MseLossBackward>)
output :  tensor([[131183.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(7201256., grad_fn=<MseLossBackward>)
output :  tensor([[94889.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(12315.7979, grad_fn=<MseLossBackward>)
output :  tensor([[153487.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7593e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176709.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(10178792., grad_fn=<MseLossBackward>)
output :  tensor([[121614.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(1241048.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188896.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6043e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145097.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3030e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149378.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(271473.5625, grad_fn=<MseLossBackward>)
output :  tensor([[188934.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1403373.3750, grad_fn=<MseLossBackward>)
output :  tensor([[253201.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5901e+09, grad_fn=<MseLossBackward>)
output :  tensor([[90506.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(986561.0625, grad_fn=<MseLossBackward>)
output :  tensor([[237785.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4904356.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130579.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4322371., grad_fn=<MseLossBackward>)
output :  tensor([[165157.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0149e+10, grad_fn=<MseLossBackward>)
output :  tensor([[114640.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1435e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180197.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(17616514., grad_fn=<MseLossBackward>)
output :  tensor([[162907.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5259e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153708.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3864e+08, grad_fn=<MseLossBackward>)
output :  tensor([[240868.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3492518.5000, grad_fn=<MseLossBackward>)
output :  tensor([[226446.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9563e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123636.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(11314972., grad_fn=<MseLossBackward>)
output :  tensor([[124632.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1870184.5000, grad_fn=<MseLossBackward>)
output :  tensor([[225401.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2555602., grad_fn=<MseLossBackward>)
output :  tensor([[228515.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(30082312., grad_fn=<MseLossBackward>)
output :  tensor([[224489.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4885067., grad_fn=<MseLossBackward>)
output :  tensor([[147286.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(508391.2812, grad_fn=<MseLossBackward>)
output :  tensor([[208775.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1500012.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130435.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0889e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131984.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(266239.8750, grad_fn=<MseLossBackward>)
output :  tensor([[310125.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(23762882., grad_fn=<MseLossBackward>)
output :  tensor([[134060.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(48153408., grad_fn=<MseLossBackward>)
output :  tensor([[121572.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9782e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109608.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(11770.5547, grad_fn=<MseLossBackward>)
output :  tensor([[155792.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7914e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180625.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8548e+09, grad_fn=<MseLossBackward>)
output :  tensor([[170195.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7862679., grad_fn=<MseLossBackward>)
output :  tensor([[195252.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(33031960., grad_fn=<MseLossBackward>)
output :  tensor([[95771.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(17883582., grad_fn=<MseLossBackward>)
output :  tensor([[181172.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4719824., grad_fn=<MseLossBackward>)
output :  tensor([[171409.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(12316590., grad_fn=<MseLossBackward>)
output :  tensor([[137241.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3093971., grad_fn=<MseLossBackward>)
output :  tensor([[264039.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0365e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143943.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4743e+09, grad_fn=<MseLossBackward>)
output :  tensor([[170777.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4939714.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142401.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5766301.5000, grad_fn=<MseLossBackward>)
output :  tensor([[202101.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2566053.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169031.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(937145., grad_fn=<MseLossBackward>)
output :  tensor([[244538.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(290116.8750, grad_fn=<MseLossBackward>)
output :  tensor([[135355.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(732174.3750, grad_fn=<MseLossBackward>)
output :  tensor([[150605.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1575534.8750, grad_fn=<MseLossBackward>)
output :  tensor([[213292.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2915289.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161838.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9996663., grad_fn=<MseLossBackward>)
output :  tensor([[191314.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5358791., grad_fn=<MseLossBackward>)
output :  tensor([[134461.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0215e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127000.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3996875.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140338.]], grad_fn=<AddmmBackward>)
loss:  tensor(114244., grad_fn=<MseLossBackward>)
output :  tensor([[203929.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2995e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166150.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6164e+09, grad_fn=<MseLossBackward>)
output :  tensor([[73985.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9559e+08, grad_fn=<MseLossBackward>)
output :  tensor([[95576.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2269e+08, grad_fn=<MseLossBackward>)
output :  tensor([[255318.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4102333.7500, grad_fn=<MseLossBackward>)
output :  tensor([[204135.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2426e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116281.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(1641541.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155884.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9957e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207672.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5197e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183207.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5330e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158690.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(13619675., grad_fn=<MseLossBackward>)
output :  tensor([[170287.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(82782.0781, grad_fn=<MseLossBackward>)
output :  tensor([[112480.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6345676., grad_fn=<MseLossBackward>)
output :  tensor([[161057.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(36691792., grad_fn=<MseLossBackward>)
output :  tensor([[193024.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9252e+08, grad_fn=<MseLossBackward>)
output :  tensor([[216968.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6408334., grad_fn=<MseLossBackward>)
output :  tensor([[245826.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4917e+11, grad_fn=<MseLossBackward>)
output :  tensor([[146892.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(11512.6191, grad_fn=<MseLossBackward>)
output :  tensor([[108830.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(123140.6797, grad_fn=<MseLossBackward>)
output :  tensor([[172064.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(96738600., grad_fn=<MseLossBackward>)
output :  tensor([[149427.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1151060.7500, grad_fn=<MseLossBackward>)
output :  tensor([[234223.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7708518.5000, grad_fn=<MseLossBackward>)
output :  tensor([[112837.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(4676980.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186586.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(13593393., grad_fn=<MseLossBackward>)
output :  tensor([[190111.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(11635347., grad_fn=<MseLossBackward>)
output :  tensor([[163416.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4518e+10, grad_fn=<MseLossBackward>)
output :  tensor([[94803.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9054e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237722.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1631886.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176893.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(798118.8750, grad_fn=<MseLossBackward>)
output :  tensor([[137328.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7136912., grad_fn=<MseLossBackward>)
output :  tensor([[235202.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(40848.1992, grad_fn=<MseLossBackward>)
output :  tensor([[161591.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1984884.7500, grad_fn=<MseLossBackward>)
output :  tensor([[205626.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4250e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136077.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1161747.1250, grad_fn=<MseLossBackward>)
output :  tensor([[185702.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6180e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137764.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3113956.5000, grad_fn=<MseLossBackward>)
output :  tensor([[227600.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(70553960., grad_fn=<MseLossBackward>)
output :  tensor([[227208.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1946e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93612.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(13048463., grad_fn=<MseLossBackward>)
output :  tensor([[160053.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(383335.1250, grad_fn=<MseLossBackward>)
output :  tensor([[249301.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4781e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145819.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(672041.3125, grad_fn=<MseLossBackward>)
output :  tensor([[110134.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8606e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163092.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1981628.1250, grad_fn=<MseLossBackward>)
output :  tensor([[140568.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(11773798., grad_fn=<MseLossBackward>)
output :  tensor([[129317.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1249749.3750, grad_fn=<MseLossBackward>)
output :  tensor([[189642.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8105e+09, grad_fn=<MseLossBackward>)
output :  tensor([[122190.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(95969.2656, grad_fn=<MseLossBackward>)
output :  tensor([[148977.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(9133712., grad_fn=<MseLossBackward>)
output :  tensor([[168721.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(9170014., grad_fn=<MseLossBackward>)
output :  tensor([[151508.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(258476.9219, grad_fn=<MseLossBackward>)
output :  tensor([[157178.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(32737708., grad_fn=<MseLossBackward>)
output :  tensor([[137641.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2032e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132735.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(541121.1250, grad_fn=<MseLossBackward>)
output :  tensor([[154371.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3627e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146952.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7845338.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159921.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3343126.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135599.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6045e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147897.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(814957.5625, grad_fn=<MseLossBackward>)
output :  tensor([[185442.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6541365.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169386.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(149720.6250, grad_fn=<MseLossBackward>)
output :  tensor([[180772.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(596708., grad_fn=<MseLossBackward>)
output :  tensor([[222213.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4901519.5000, grad_fn=<MseLossBackward>)
output :  tensor([[107555.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(118422.0156, grad_fn=<MseLossBackward>)
output :  tensor([[137273.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5310e+08, grad_fn=<MseLossBackward>)
output :  tensor([[284289.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2926772.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117528.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2335882.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177950.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7682e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185102.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(10455.0625, grad_fn=<MseLossBackward>)
output :  tensor([[187206.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2912889., grad_fn=<MseLossBackward>)
output :  tensor([[251855.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3566e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222609.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(371166.5312, grad_fn=<MseLossBackward>)
output :  tensor([[122460.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7426e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173398.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1609e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123657.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(117306.2500, grad_fn=<MseLossBackward>)
output :  tensor([[183239.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5301e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151847.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1328364.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153164.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(44415560., grad_fn=<MseLossBackward>)
output :  tensor([[207382.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1170893.1250, grad_fn=<MseLossBackward>)
output :  tensor([[146387.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9287e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174218.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3173297., grad_fn=<MseLossBackward>)
output :  tensor([[250883.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1888e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147211.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(621141., grad_fn=<MseLossBackward>)
output :  tensor([[202847.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(33420.4102, grad_fn=<MseLossBackward>)
output :  tensor([[165768.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(33858216., grad_fn=<MseLossBackward>)
output :  tensor([[124521.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3339e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135061.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(473537.5312, grad_fn=<MseLossBackward>)
output :  tensor([[184555.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(308267.8750, grad_fn=<MseLossBackward>)
output :  tensor([[194812.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(23160156., grad_fn=<MseLossBackward>)
output :  tensor([[227988.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7224e+09, grad_fn=<MseLossBackward>)
output :  tensor([[249617.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(54497152., grad_fn=<MseLossBackward>)
output :  tensor([[188799.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6952e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144834.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8446e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145025.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(276330.9062, grad_fn=<MseLossBackward>)
output :  tensor([[71335.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8190e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128708.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(39578940., grad_fn=<MseLossBackward>)
output :  tensor([[129162.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(68918.5547, grad_fn=<MseLossBackward>)
output :  tensor([[153478.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(271799.3125, grad_fn=<MseLossBackward>)
output :  tensor([[131216.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(17777950., grad_fn=<MseLossBackward>)
output :  tensor([[75801.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(488076.8750, grad_fn=<MseLossBackward>)
output :  tensor([[82352.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(123920.5000, grad_fn=<MseLossBackward>)
output :  tensor([[239982.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(63720804., grad_fn=<MseLossBackward>)
output :  tensor([[140048.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5893e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130653.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(23622.2500, grad_fn=<MseLossBackward>)
output :  tensor([[169078.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4321721.5000, grad_fn=<MseLossBackward>)
output :  tensor([[233310.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2855730.2500, grad_fn=<MseLossBackward>)
output :  tensor([[187045.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(25956000., grad_fn=<MseLossBackward>)
output :  tensor([[159343.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(11181396., grad_fn=<MseLossBackward>)
output :  tensor([[203370.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(29927054., grad_fn=<MseLossBackward>)
output :  tensor([[204397.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0629e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136561.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(192679.8438, grad_fn=<MseLossBackward>)
output :  tensor([[152854.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4603505.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134164.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3368830.7500, grad_fn=<MseLossBackward>)
output :  tensor([[198985.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6191e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155770.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3133840.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137741.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9573e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145181.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(79462.3281, grad_fn=<MseLossBackward>)
output :  tensor([[208164.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(14709862., grad_fn=<MseLossBackward>)
output :  tensor([[99054.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9087e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168254.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(569435.3125, grad_fn=<MseLossBackward>)
output :  tensor([[127290.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(503412.4375, grad_fn=<MseLossBackward>)
output :  tensor([[147496.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(246838.1875, grad_fn=<MseLossBackward>)
output :  tensor([[104746.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7947e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138463.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(927489.3750, grad_fn=<MseLossBackward>)
output :  tensor([[238567.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6592778.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146710.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2925543., grad_fn=<MseLossBackward>)
output :  tensor([[137975.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(226561.1250, grad_fn=<MseLossBackward>)
output :  tensor([[163989.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2952e+09, grad_fn=<MseLossBackward>)
output :  tensor([[270168.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(61328476., grad_fn=<MseLossBackward>)
output :  tensor([[173958.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1085275.6250, grad_fn=<MseLossBackward>)
output :  tensor([[103211.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(189850.8281, grad_fn=<MseLossBackward>)
output :  tensor([[205245.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2207e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154503.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(20214718., grad_fn=<MseLossBackward>)
output :  tensor([[163527.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5752e+10, grad_fn=<MseLossBackward>)
output :  tensor([[100004.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(2906146., grad_fn=<MseLossBackward>)
output :  tensor([[123569.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(907.9864, grad_fn=<MseLossBackward>)
output :  tensor([[155227.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(596828.6875, grad_fn=<MseLossBackward>)
output :  tensor([[141505.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2266906.7500, grad_fn=<MseLossBackward>)
output :  tensor([[200175.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(30965., grad_fn=<MseLossBackward>)
output :  tensor([[140451.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2397513.5000, grad_fn=<MseLossBackward>)
output :  tensor([[263580.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1692275.7500, grad_fn=<MseLossBackward>)
output :  tensor([[127551.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1938e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162742.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7604668., grad_fn=<MseLossBackward>)
output :  tensor([[187124.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1892043.2500, grad_fn=<MseLossBackward>)
output :  tensor([[127660.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1190e+08, grad_fn=<MseLossBackward>)
output :  tensor([[249329.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(449884.5938, grad_fn=<MseLossBackward>)
output :  tensor([[158427.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1637e+08, grad_fn=<MseLossBackward>)
output :  tensor([[240916.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(19653706., grad_fn=<MseLossBackward>)
output :  tensor([[145353.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1833104.5000, grad_fn=<MseLossBackward>)
output :  tensor([[208045.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3818360.2500, grad_fn=<MseLossBackward>)
output :  tensor([[174301.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3616653., grad_fn=<MseLossBackward>)
output :  tensor([[151933.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4272424.5000, grad_fn=<MseLossBackward>)
output :  tensor([[118170.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(29203.6055, grad_fn=<MseLossBackward>)
output :  tensor([[235470.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6646e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237082.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8513995., grad_fn=<MseLossBackward>)
output :  tensor([[152041.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1677996.3750, grad_fn=<MseLossBackward>)
output :  tensor([[254047.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(726063.7500, grad_fn=<MseLossBackward>)
output :  tensor([[123802.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(86464136., grad_fn=<MseLossBackward>)
output :  tensor([[176524.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(274625.1250, grad_fn=<MseLossBackward>)
output :  tensor([[159562.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(191679.7812, grad_fn=<MseLossBackward>)
output :  tensor([[136173.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(26760090., grad_fn=<MseLossBackward>)
output :  tensor([[190858.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7649e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162623.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1895526.6250, grad_fn=<MseLossBackward>)
output :  tensor([[161724.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1627936.7500, grad_fn=<MseLossBackward>)
output :  tensor([[156218.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3173742.2500, grad_fn=<MseLossBackward>)
output :  tensor([[152295.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5737671.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174162.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1812e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160084.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7087.5352, grad_fn=<MseLossBackward>)
output :  tensor([[379567.]], grad_fn=<AddmmBackward>)
loss:  tensor(19386408., grad_fn=<MseLossBackward>)
output :  tensor([[131899.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(24005406., grad_fn=<MseLossBackward>)
output :  tensor([[129049.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8965e+09, grad_fn=<MseLossBackward>)
output :  tensor([[281998.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(616421.2500, grad_fn=<MseLossBackward>)
output :  tensor([[162994.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(989092.4375, grad_fn=<MseLossBackward>)
output :  tensor([[131511.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2125e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238423.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(41256736., grad_fn=<MseLossBackward>)
output :  tensor([[181683.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1400413.3750, grad_fn=<MseLossBackward>)
output :  tensor([[154451.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6011308., grad_fn=<MseLossBackward>)
output :  tensor([[145401.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(161327.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153524.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7638e+08, grad_fn=<MseLossBackward>)
output :  tensor([[99292.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(500257.8125, grad_fn=<MseLossBackward>)
output :  tensor([[74347.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0585e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165546.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(298167.1875, grad_fn=<MseLossBackward>)
output :  tensor([[189330.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4953e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161118.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9725335., grad_fn=<MseLossBackward>)
output :  tensor([[160297.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7826880.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133856.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(12910435., grad_fn=<MseLossBackward>)
output :  tensor([[205120.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(688251.6875, grad_fn=<MseLossBackward>)
output :  tensor([[139600.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2561050., grad_fn=<MseLossBackward>)
output :  tensor([[182393.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6284e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145750.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(62445.3242, grad_fn=<MseLossBackward>)
output :  tensor([[110148.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3703e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92794.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1454209.8750, grad_fn=<MseLossBackward>)
output :  tensor([[178014.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(9087116., grad_fn=<MseLossBackward>)
output :  tensor([[260712.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(97558.6172, grad_fn=<MseLossBackward>)
output :  tensor([[140148.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1827439.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158281.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2604088.2500, grad_fn=<MseLossBackward>)
output :  tensor([[131423.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1159155., grad_fn=<MseLossBackward>)
output :  tensor([[152219.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7396955., grad_fn=<MseLossBackward>)
output :  tensor([[172084.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(17513702., grad_fn=<MseLossBackward>)
output :  tensor([[127669.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(448324.4062, grad_fn=<MseLossBackward>)
output :  tensor([[172183.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3896e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156059.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(884922.3750, grad_fn=<MseLossBackward>)
output :  tensor([[115008.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2225504.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159939.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3379e+09, grad_fn=<MseLossBackward>)
output :  tensor([[49747.9492]], grad_fn=<AddmmBackward>)
loss:  tensor(5071732.5000, grad_fn=<MseLossBackward>)
output :  tensor([[233678.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2129e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199531.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2156171., grad_fn=<MseLossBackward>)
output :  tensor([[184356.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(413770.5625, grad_fn=<MseLossBackward>)
output :  tensor([[106463.]], grad_fn=<AddmmBackward>)
loss:  tensor(214369., grad_fn=<MseLossBackward>)
output :  tensor([[90253.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(10582161., grad_fn=<MseLossBackward>)
output :  tensor([[140731.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(534795.1250, grad_fn=<MseLossBackward>)
output :  tensor([[221574.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2455e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205282.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4919177.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163034.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3863190.2500, grad_fn=<MseLossBackward>)
output :  tensor([[172619.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5342e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190386.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(149164.9219, grad_fn=<MseLossBackward>)
output :  tensor([[89565.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6583714.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139745.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(64531.8750, grad_fn=<MseLossBackward>)
output :  tensor([[110176.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(104637.0859, grad_fn=<MseLossBackward>)
output :  tensor([[148194.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4967e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173515.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8076e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193602.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2990e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181248.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1559142.3750, grad_fn=<MseLossBackward>)
output :  tensor([[100677.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(17448112., grad_fn=<MseLossBackward>)
output :  tensor([[116713.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(619356.6875, grad_fn=<MseLossBackward>)
output :  tensor([[161174.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2100e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204705.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(22143348., grad_fn=<MseLossBackward>)
output :  tensor([[144218.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(47933.6289, grad_fn=<MseLossBackward>)
train_loss: [2.5733402e+09]
epoch_result tensor([0.])
output :  tensor([[158167.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(110753.7578, grad_fn=<MseLossBackward>)
output :  tensor([[124420.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(5860446.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200926.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(45233820., grad_fn=<MseLossBackward>)
output :  tensor([[177180.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(32467.5352, grad_fn=<MseLossBackward>)
output :  tensor([[151572.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9843e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127752.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(61128.6992, grad_fn=<MseLossBackward>)
output :  tensor([[140525.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(225476.5938, grad_fn=<MseLossBackward>)
output :  tensor([[119081.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(6676.6772, grad_fn=<MseLossBackward>)
output :  tensor([[65979.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(55948412., grad_fn=<MseLossBackward>)
output :  tensor([[166710.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(504388.4688, grad_fn=<MseLossBackward>)
output :  tensor([[135603.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(19325640., grad_fn=<MseLossBackward>)
output :  tensor([[224497.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(252145.2031, grad_fn=<MseLossBackward>)
output :  tensor([[169193.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(37623.8750, grad_fn=<MseLossBackward>)
output :  tensor([[250121.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(178004.8906, grad_fn=<MseLossBackward>)
output :  tensor([[54518.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(232271.2812, grad_fn=<MseLossBackward>)
output :  tensor([[161622.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9318e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173655.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1808814.8750, grad_fn=<MseLossBackward>)
output :  tensor([[167950.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3111e+08, grad_fn=<MseLossBackward>)
output :  tensor([[274395.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(365420.2500, grad_fn=<MseLossBackward>)
output :  tensor([[197706.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(498678.7188, grad_fn=<MseLossBackward>)
output :  tensor([[139899.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4311e+10, grad_fn=<MseLossBackward>)
output :  tensor([[192469.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1988011.8750, grad_fn=<MseLossBackward>)
output :  tensor([[178953.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1110e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151336.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(113368.9922, grad_fn=<MseLossBackward>)
output :  tensor([[170761.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(579239.9375, grad_fn=<MseLossBackward>)
output :  tensor([[89772.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(19116502., grad_fn=<MseLossBackward>)
output :  tensor([[171080.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3733e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185654.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(427859.0625, grad_fn=<MseLossBackward>)
output :  tensor([[207543.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2998e+09, grad_fn=<MseLossBackward>)
output :  tensor([[112156.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(4651402., grad_fn=<MseLossBackward>)
output :  tensor([[173000.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4003751., grad_fn=<MseLossBackward>)
output :  tensor([[137427.]], grad_fn=<AddmmBackward>)
loss:  tensor(859329., grad_fn=<MseLossBackward>)
output :  tensor([[130182.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1397197.8750, grad_fn=<MseLossBackward>)
output :  tensor([[120815.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1730334.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147487.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2946e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165277.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2417e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150011.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(97178.3203, grad_fn=<MseLossBackward>)
output :  tensor([[181711.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2929339.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144548.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(12591630., grad_fn=<MseLossBackward>)
output :  tensor([[106525.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7309e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134453.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4877e+09, grad_fn=<MseLossBackward>)
output :  tensor([[132273.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7431757.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126745.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(64766.2734, grad_fn=<MseLossBackward>)
output :  tensor([[225346.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(120311.4297, grad_fn=<MseLossBackward>)
output :  tensor([[131807.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(195695.6406, grad_fn=<MseLossBackward>)
output :  tensor([[143588.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(29288560., grad_fn=<MseLossBackward>)
output :  tensor([[115255.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(10601078., grad_fn=<MseLossBackward>)
output :  tensor([[159298.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(491751.5625, grad_fn=<MseLossBackward>)
output :  tensor([[145243.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4758e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194533.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6417989., grad_fn=<MseLossBackward>)
output :  tensor([[136163.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2934690.2500, grad_fn=<MseLossBackward>)
output :  tensor([[114029.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(16232967., grad_fn=<MseLossBackward>)
output :  tensor([[232734.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1601806.6250, grad_fn=<MseLossBackward>)
output :  tensor([[165914.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2635e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167030.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(64488680., grad_fn=<MseLossBackward>)
output :  tensor([[202304.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8967e+10, grad_fn=<MseLossBackward>)
output :  tensor([[248263.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1180e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141490.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4037839., grad_fn=<MseLossBackward>)
output :  tensor([[133102.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(805281.8750, grad_fn=<MseLossBackward>)
output :  tensor([[156089.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1187827.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134773.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(22790330., grad_fn=<MseLossBackward>)
output :  tensor([[180179.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3713e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180345.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(14097326., grad_fn=<MseLossBackward>)
output :  tensor([[161092.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(165801.6562, grad_fn=<MseLossBackward>)
output :  tensor([[146232.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(10446935., grad_fn=<MseLossBackward>)
output :  tensor([[143401.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(812927.6250, grad_fn=<MseLossBackward>)
output :  tensor([[142673.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(5411948., grad_fn=<MseLossBackward>)
output :  tensor([[173597.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3677e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193288.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6226e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135215.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1648856.6250, grad_fn=<MseLossBackward>)
output :  tensor([[177089.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(26932694., grad_fn=<MseLossBackward>)
output :  tensor([[178803.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4826397., grad_fn=<MseLossBackward>)
output :  tensor([[113566.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(2056064.7500, grad_fn=<MseLossBackward>)
output :  tensor([[219303.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2879278.7500, grad_fn=<MseLossBackward>)
output :  tensor([[179455.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(16356716., grad_fn=<MseLossBackward>)
output :  tensor([[127681.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(4757681., grad_fn=<MseLossBackward>)
output :  tensor([[194788.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2927628., grad_fn=<MseLossBackward>)
output :  tensor([[174753.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(21430.2148, grad_fn=<MseLossBackward>)
output :  tensor([[213673.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9783e+10, grad_fn=<MseLossBackward>)
output :  tensor([[208526.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6116424.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164430.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1176e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191003.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(12228025., grad_fn=<MseLossBackward>)
output :  tensor([[111491.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(2276114.5000, grad_fn=<MseLossBackward>)
output :  tensor([[115582.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(9501132., grad_fn=<MseLossBackward>)
output :  tensor([[108766.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(10453501., grad_fn=<MseLossBackward>)
output :  tensor([[145535.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1600185.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161605.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2775e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178990.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1018333.2500, grad_fn=<MseLossBackward>)
output :  tensor([[127215.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(80784.7422, grad_fn=<MseLossBackward>)
output :  tensor([[143427.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2471970., grad_fn=<MseLossBackward>)
output :  tensor([[180290.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0603e+09, grad_fn=<MseLossBackward>)
output :  tensor([[121672.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(22776682., grad_fn=<MseLossBackward>)
output :  tensor([[194138.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8185857.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143425.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2478902.7500, grad_fn=<MseLossBackward>)
output :  tensor([[214210.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1717123.6250, grad_fn=<MseLossBackward>)
output :  tensor([[126208.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(43423.3984, grad_fn=<MseLossBackward>)
output :  tensor([[248704.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(141999.4375, grad_fn=<MseLossBackward>)
output :  tensor([[238252.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1853e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147671.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6475e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85675.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0887e+08, grad_fn=<MseLossBackward>)
output :  tensor([[193848.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5693e+09, grad_fn=<MseLossBackward>)
output :  tensor([[80059.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(884966.4375, grad_fn=<MseLossBackward>)
output :  tensor([[138177.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1749667.5000, grad_fn=<MseLossBackward>)
output :  tensor([[79237.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(13969023., grad_fn=<MseLossBackward>)
output :  tensor([[144547.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2542031.7500, grad_fn=<MseLossBackward>)
output :  tensor([[173005.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(8965533., grad_fn=<MseLossBackward>)
output :  tensor([[153074.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(180877.4375, grad_fn=<MseLossBackward>)
output :  tensor([[108735.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(1783455.8750, grad_fn=<MseLossBackward>)
output :  tensor([[205575.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2138e+10, grad_fn=<MseLossBackward>)
output :  tensor([[130345.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3407023.7500, grad_fn=<MseLossBackward>)
output :  tensor([[270997.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(81046128., grad_fn=<MseLossBackward>)
output :  tensor([[306857.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(9875895., grad_fn=<MseLossBackward>)
output :  tensor([[105573.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3712967.7500, grad_fn=<MseLossBackward>)
output :  tensor([[170452.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4190401., grad_fn=<MseLossBackward>)
output :  tensor([[134132.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8292e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144501.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(30263064., grad_fn=<MseLossBackward>)
output :  tensor([[128139.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(4453452., grad_fn=<MseLossBackward>)
output :  tensor([[126771.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(3136745.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135600.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8124e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227915.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8058e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193000.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1904e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146940.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(9245020., grad_fn=<MseLossBackward>)
output :  tensor([[130813.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(10978143., grad_fn=<MseLossBackward>)
output :  tensor([[112456.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(1455359.5000, grad_fn=<MseLossBackward>)
output :  tensor([[255880.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8664e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134853.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(21590.6289, grad_fn=<MseLossBackward>)
output :  tensor([[197915.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(25848804., grad_fn=<MseLossBackward>)
output :  tensor([[111501.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(43583720., grad_fn=<MseLossBackward>)
output :  tensor([[141297.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1815629.8750, grad_fn=<MseLossBackward>)
output :  tensor([[207657.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8367e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177009.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8355622.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186305.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1705064.6250, grad_fn=<MseLossBackward>)
output :  tensor([[163858.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1066e+10, grad_fn=<MseLossBackward>)
output :  tensor([[305169.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8983e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196684.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1476870.5000, grad_fn=<MseLossBackward>)
output :  tensor([[259135.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0657e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222931.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8549e+09, grad_fn=<MseLossBackward>)
output :  tensor([[284437.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0603e+09, grad_fn=<MseLossBackward>)
output :  tensor([[225960.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3844601.7500, grad_fn=<MseLossBackward>)
output :  tensor([[225361.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7768e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195270.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2992089., grad_fn=<MseLossBackward>)
output :  tensor([[156113.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3515e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137223.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(22315438., grad_fn=<MseLossBackward>)
output :  tensor([[136293.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(628972.9375, grad_fn=<MseLossBackward>)
output :  tensor([[92354.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1834268.1250, grad_fn=<MseLossBackward>)
output :  tensor([[108997.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(995208.8750, grad_fn=<MseLossBackward>)
output :  tensor([[275158.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8881e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236153.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1329841.3750, grad_fn=<MseLossBackward>)
output :  tensor([[150283.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(27917684., grad_fn=<MseLossBackward>)
output :  tensor([[140734.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(10463608., grad_fn=<MseLossBackward>)
output :  tensor([[174019.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(82225.5625, grad_fn=<MseLossBackward>)
output :  tensor([[144568.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(464740.4688, grad_fn=<MseLossBackward>)
output :  tensor([[166139.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0434e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165693.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(481527.5625, grad_fn=<MseLossBackward>)
output :  tensor([[138047.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1097419.8750, grad_fn=<MseLossBackward>)
output :  tensor([[188402.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3432e+09, grad_fn=<MseLossBackward>)
output :  tensor([[112665.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(442245.7812, grad_fn=<MseLossBackward>)
output :  tensor([[172683.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(467620.9062, grad_fn=<MseLossBackward>)
output :  tensor([[120123.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(15296.6650, grad_fn=<MseLossBackward>)
output :  tensor([[88456.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2120527.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178247.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3070106.2500, grad_fn=<MseLossBackward>)
output :  tensor([[110877.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(955536.8125, grad_fn=<MseLossBackward>)
output :  tensor([[239019.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(385.1406, grad_fn=<MseLossBackward>)
output :  tensor([[245845.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(715451.6250, grad_fn=<MseLossBackward>)
output :  tensor([[126329.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(10050931., grad_fn=<MseLossBackward>)
output :  tensor([[112698.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(13985438., grad_fn=<MseLossBackward>)
output :  tensor([[289722.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1736e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177436.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(35246856., grad_fn=<MseLossBackward>)
output :  tensor([[122990.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(4038184.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141503.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5240e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202468.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3297e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141385.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(148742.7969, grad_fn=<MseLossBackward>)
output :  tensor([[159872.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4431e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151663.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5003260.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128445.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(1111426.6250, grad_fn=<MseLossBackward>)
output :  tensor([[250167.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6469e+10, grad_fn=<MseLossBackward>)
output :  tensor([[399533.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6084393., grad_fn=<MseLossBackward>)
output :  tensor([[107092.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3639689., grad_fn=<MseLossBackward>)
output :  tensor([[125623.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(50744808., grad_fn=<MseLossBackward>)
output :  tensor([[152864.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(44034216., grad_fn=<MseLossBackward>)
output :  tensor([[129820.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8467e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163474.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4252e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173947.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0893e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103459.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(19716.1094, grad_fn=<MseLossBackward>)
output :  tensor([[139691.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1712990.1250, grad_fn=<MseLossBackward>)
output :  tensor([[365459.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3365505., grad_fn=<MseLossBackward>)
output :  tensor([[206230.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2820e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171541.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(15668114., grad_fn=<MseLossBackward>)
output :  tensor([[200261.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6963579., grad_fn=<MseLossBackward>)
output :  tensor([[141370.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(5618307.5000, grad_fn=<MseLossBackward>)
output :  tensor([[192429.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4285805.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134146.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1005e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180369.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(397687.8750, grad_fn=<MseLossBackward>)
output :  tensor([[238763.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(10476753., grad_fn=<MseLossBackward>)
output :  tensor([[171052.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(8687664., grad_fn=<MseLossBackward>)
output :  tensor([[106535.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(2144279.7500, grad_fn=<MseLossBackward>)
output :  tensor([[265751.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1416620.6250, grad_fn=<MseLossBackward>)
output :  tensor([[244447.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(30825746., grad_fn=<MseLossBackward>)
output :  tensor([[125749.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(7558977., grad_fn=<MseLossBackward>)
output :  tensor([[215575.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5313e+09, grad_fn=<MseLossBackward>)
output :  tensor([[308536.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8101e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204308.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7241901.5000, grad_fn=<MseLossBackward>)
output :  tensor([[215052.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5612e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159136.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1528352.7500, grad_fn=<MseLossBackward>)
output :  tensor([[171873.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3547925.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161178.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(18035150., grad_fn=<MseLossBackward>)
output :  tensor([[171741.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3033910.7500, grad_fn=<MseLossBackward>)
output :  tensor([[239826.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9376e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225480.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(15801495., grad_fn=<MseLossBackward>)
output :  tensor([[159378.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5323e+08, grad_fn=<MseLossBackward>)
output :  tensor([[117752.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(27539290., grad_fn=<MseLossBackward>)
output :  tensor([[177850.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(722898.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182992.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9302e+09, grad_fn=<MseLossBackward>)
output :  tensor([[208795.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4530e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135342.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(829494., grad_fn=<MseLossBackward>)
output :  tensor([[148771.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3827e+08, grad_fn=<MseLossBackward>)
output :  tensor([[271998.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(25018440., grad_fn=<MseLossBackward>)
output :  tensor([[89679.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(21902254., grad_fn=<MseLossBackward>)
output :  tensor([[237067.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(321914.3750, grad_fn=<MseLossBackward>)
output :  tensor([[263166.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0225e+11, grad_fn=<MseLossBackward>)
output :  tensor([[167655.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5496094., grad_fn=<MseLossBackward>)
output :  tensor([[196189.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5063e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153473.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2329868.2500, grad_fn=<MseLossBackward>)
output :  tensor([[205688.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1360e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129659.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(434569.3750, grad_fn=<MseLossBackward>)
output :  tensor([[152952.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(63239524., grad_fn=<MseLossBackward>)
output :  tensor([[167389.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1949e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181382.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(19955206., grad_fn=<MseLossBackward>)
output :  tensor([[127996.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3985388.2500, grad_fn=<MseLossBackward>)
output :  tensor([[136729.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(52842.5156, grad_fn=<MseLossBackward>)
output :  tensor([[171761.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1535004.8750, grad_fn=<MseLossBackward>)
output :  tensor([[195183.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0048e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239373.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(13154789., grad_fn=<MseLossBackward>)
output :  tensor([[153454.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2387894.2500, grad_fn=<MseLossBackward>)
output :  tensor([[198130.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4537898.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163274.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7149e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180932.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2052996.3750, grad_fn=<MseLossBackward>)
output :  tensor([[180149.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(62094.4102, grad_fn=<MseLossBackward>)
output :  tensor([[99947.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8688033., grad_fn=<MseLossBackward>)
output :  tensor([[172121.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1638e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135706.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(499495.5625, grad_fn=<MseLossBackward>)
output :  tensor([[120047.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(25478598., grad_fn=<MseLossBackward>)
output :  tensor([[173154.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(715451.6250, grad_fn=<MseLossBackward>)
output :  tensor([[85198.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(39210.1875, grad_fn=<MseLossBackward>)
output :  tensor([[283954.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(36544668., grad_fn=<MseLossBackward>)
output :  tensor([[167194.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4814801.5000, grad_fn=<MseLossBackward>)
output :  tensor([[193055.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9631e+10, grad_fn=<MseLossBackward>)
output :  tensor([[246639.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9345e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151841.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(707701.5625, grad_fn=<MseLossBackward>)
output :  tensor([[124808.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(654228.1875, grad_fn=<MseLossBackward>)
output :  tensor([[122172.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5162552., grad_fn=<MseLossBackward>)
output :  tensor([[144241.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5509e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176828.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(8000235.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110931.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0832e+08, grad_fn=<MseLossBackward>)
output :  tensor([[210368.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1584e+10, grad_fn=<MseLossBackward>)
output :  tensor([[251885.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0787e+08, grad_fn=<MseLossBackward>)
output :  tensor([[252838.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0264e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221049.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2220e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196415.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4181e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186874.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(391172.0625, grad_fn=<MseLossBackward>)
output :  tensor([[206151.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7838e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189467.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1472e+10, grad_fn=<MseLossBackward>)
output :  tensor([[176505.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4991733.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151701.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(89102.2500, grad_fn=<MseLossBackward>)
output :  tensor([[334728.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5159854., grad_fn=<MseLossBackward>)
output :  tensor([[206928.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(25718368., grad_fn=<MseLossBackward>)
output :  tensor([[164427.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(19601926., grad_fn=<MseLossBackward>)
output :  tensor([[188855.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7714e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106934.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3742653., grad_fn=<MseLossBackward>)
output :  tensor([[276259.]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7697e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170618.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(10769678., grad_fn=<MseLossBackward>)
output :  tensor([[207492.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(36088180., grad_fn=<MseLossBackward>)
output :  tensor([[212611.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(70369816., grad_fn=<MseLossBackward>)
output :  tensor([[180031.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(692172., grad_fn=<MseLossBackward>)
output :  tensor([[203675.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3519024.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153709.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1665712.8750, grad_fn=<MseLossBackward>)
output :  tensor([[147882.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2927e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118535.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1251.3906, grad_fn=<MseLossBackward>)
output :  tensor([[139058.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(886392.8125, grad_fn=<MseLossBackward>)
output :  tensor([[149739.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(546698.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200918.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6150e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159286.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(45642.3164, grad_fn=<MseLossBackward>)
output :  tensor([[100049.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(301701.3125, grad_fn=<MseLossBackward>)
output :  tensor([[224937.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2687e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184767.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7123e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174521.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3854412., grad_fn=<MseLossBackward>)
output :  tensor([[81449.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(303497.6875, grad_fn=<MseLossBackward>)
output :  tensor([[130097.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2551008., grad_fn=<MseLossBackward>)
output :  tensor([[215024.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1050048.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143375.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(390507.8125, grad_fn=<MseLossBackward>)
output :  tensor([[136651.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(44245572., grad_fn=<MseLossBackward>)
output :  tensor([[140648.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3807376.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176372.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5111e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146291.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5250829., grad_fn=<MseLossBackward>)
output :  tensor([[161661.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2761309.2500, grad_fn=<MseLossBackward>)
output :  tensor([[213421.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2491119.7500, grad_fn=<MseLossBackward>)
output :  tensor([[136346.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8263e+08, grad_fn=<MseLossBackward>)
output :  tensor([[254101.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(806825., grad_fn=<MseLossBackward>)
output :  tensor([[161318.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3306203.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126680.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(3310722.5000, grad_fn=<MseLossBackward>)
output :  tensor([[97518.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6345046., grad_fn=<MseLossBackward>)
output :  tensor([[155282.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0102e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176853.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(9280686., grad_fn=<MseLossBackward>)
output :  tensor([[120852.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(124366.4297, grad_fn=<MseLossBackward>)
output :  tensor([[188840.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6088e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145360.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3376e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153771.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(14985488., grad_fn=<MseLossBackward>)
output :  tensor([[188735.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(970963.8750, grad_fn=<MseLossBackward>)
output :  tensor([[253846.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5390e+09, grad_fn=<MseLossBackward>)
output :  tensor([[89704.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(3224858.2500, grad_fn=<MseLossBackward>)
output :  tensor([[239618.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(145327.7344, grad_fn=<MseLossBackward>)
output :  tensor([[126154.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(5503532.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165125.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0156e+10, grad_fn=<MseLossBackward>)
output :  tensor([[114359.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0619e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178842.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(8079717.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163637.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8746e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154301.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6653e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235165.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(14706865., grad_fn=<MseLossBackward>)
output :  tensor([[225387.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0636e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124962.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4151915.7500, grad_fn=<MseLossBackward>)
output :  tensor([[131691.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(32390860., grad_fn=<MseLossBackward>)
output :  tensor([[224046.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(8723901., grad_fn=<MseLossBackward>)
output :  tensor([[231070.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8581696., grad_fn=<MseLossBackward>)
output :  tensor([[229500.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7843675.5000, grad_fn=<MseLossBackward>)
output :  tensor([[148119.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(14198.2119, grad_fn=<MseLossBackward>)
output :  tensor([[208841.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1342774., grad_fn=<MseLossBackward>)
output :  tensor([[127901.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(62439628., grad_fn=<MseLossBackward>)
output :  tensor([[136877.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(19159770., grad_fn=<MseLossBackward>)
output :  tensor([[309354.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(31874140., grad_fn=<MseLossBackward>)
output :  tensor([[141411.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(169075.1562, grad_fn=<MseLossBackward>)
output :  tensor([[120527.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8652e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108657.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(710306.5625, grad_fn=<MseLossBackward>)
output :  tensor([[157367.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2899e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181651.]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6628e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174299.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1687441.6250, grad_fn=<MseLossBackward>)
output :  tensor([[193164.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(61390652., grad_fn=<MseLossBackward>)
output :  tensor([[104400.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(19365500., grad_fn=<MseLossBackward>)
output :  tensor([[177566.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2056221.6250, grad_fn=<MseLossBackward>)
output :  tensor([[167965.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4243.3008, grad_fn=<MseLossBackward>)
output :  tensor([[142228.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(10426239., grad_fn=<MseLossBackward>)
output :  tensor([[263026.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2302e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142726.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3323e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174349.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1822457.8750, grad_fn=<MseLossBackward>)
output :  tensor([[139381.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(382329.6562, grad_fn=<MseLossBackward>)
output :  tensor([[200545.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2088.7756, grad_fn=<MseLossBackward>)
output :  tensor([[169476.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(274395.9062, grad_fn=<MseLossBackward>)
output :  tensor([[242865.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1287551.1250, grad_fn=<MseLossBackward>)
output :  tensor([[133033.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2150026.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150323.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(947154.7500, grad_fn=<MseLossBackward>)
output :  tensor([[213799.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1440150., grad_fn=<MseLossBackward>)
output :  tensor([[170087.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(25883134., grad_fn=<MseLossBackward>)
output :  tensor([[191701.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(7299200., grad_fn=<MseLossBackward>)
output :  tensor([[131443.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5938e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128778.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(49041.4883, grad_fn=<MseLossBackward>)
output :  tensor([[145228.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(27333618., grad_fn=<MseLossBackward>)
output :  tensor([[200902.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7056e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167503.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7566e+09, grad_fn=<MseLossBackward>)
output :  tensor([[72995.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6889e+08, grad_fn=<MseLossBackward>)
output :  tensor([[90755.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(39133332., grad_fn=<MseLossBackward>)
output :  tensor([[249119.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(17414060., grad_fn=<MseLossBackward>)
output :  tensor([[203056.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1033e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115616.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(380081.8750, grad_fn=<MseLossBackward>)
output :  tensor([[158234.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5647e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209070.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1945e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181160.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8925e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158887.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(15112535., grad_fn=<MseLossBackward>)
output :  tensor([[166901.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(9598572., grad_fn=<MseLossBackward>)
output :  tensor([[115494.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(244151.7969, grad_fn=<MseLossBackward>)
output :  tensor([[158497.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(12234036., grad_fn=<MseLossBackward>)
output :  tensor([[192241.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1486e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222982.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(12129439., grad_fn=<MseLossBackward>)
output :  tensor([[247278.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4773e+11, grad_fn=<MseLossBackward>)
output :  tensor([[150113.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(9693980., grad_fn=<MseLossBackward>)
output :  tensor([[110290.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3276722.2500, grad_fn=<MseLossBackward>)
output :  tensor([[169520.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5325e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154463.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(15706360., grad_fn=<MseLossBackward>)
output :  tensor([[237469.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(220488.9375, grad_fn=<MseLossBackward>)
output :  tensor([[114180.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(671426.6250, grad_fn=<MseLossBackward>)
output :  tensor([[177379.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(30474196., grad_fn=<MseLossBackward>)
output :  tensor([[186748.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2384.1858, grad_fn=<MseLossBackward>)
output :  tensor([[164434.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4201e+10, grad_fn=<MseLossBackward>)
output :  tensor([[93801.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6388e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243497.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(20225538., grad_fn=<MseLossBackward>)
output :  tensor([[178801.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7848402., grad_fn=<MseLossBackward>)
output :  tensor([[140541.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(292765.5312, grad_fn=<MseLossBackward>)
output :  tensor([[231066.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(15473037., grad_fn=<MseLossBackward>)
output :  tensor([[161642.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1844036.7500, grad_fn=<MseLossBackward>)
output :  tensor([[204397.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4545e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135406.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(165242.2500, grad_fn=<MseLossBackward>)
output :  tensor([[185707.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6204e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134786.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1472544.3750, grad_fn=<MseLossBackward>)
output :  tensor([[229446.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(42951024., grad_fn=<MseLossBackward>)
output :  tensor([[226539.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5039e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93031.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9191129., grad_fn=<MseLossBackward>)
output :  tensor([[161878.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5977337.5000, grad_fn=<MseLossBackward>)
output :  tensor([[249311.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4778e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145811.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(659090.2500, grad_fn=<MseLossBackward>)
output :  tensor([[110043.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8528e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164823.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(104783.7109, grad_fn=<MseLossBackward>)
output :  tensor([[147647.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(13304028., grad_fn=<MseLossBackward>)
output :  tensor([[129932.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3001664.5000, grad_fn=<MseLossBackward>)
output :  tensor([[189891.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7759e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123938.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2068203.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152713.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(509193.7500, grad_fn=<MseLossBackward>)
output :  tensor([[170177.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2473837.5000, grad_fn=<MseLossBackward>)
output :  tensor([[148820.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4752264., grad_fn=<MseLossBackward>)
output :  tensor([[161334.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2451034.7500, grad_fn=<MseLossBackward>)
output :  tensor([[136649.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6448e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132308.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(95345.8594, grad_fn=<MseLossBackward>)
output :  tensor([[154272.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3326e+08, grad_fn=<MseLossBackward>)
output :  tensor([[142782.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1875273.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162865.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1243817.3750, grad_fn=<MseLossBackward>)
output :  tensor([[135799.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7078e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148965.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(27493.7852, grad_fn=<MseLossBackward>)
output :  tensor([[185420.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6654787.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168662.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(113737.5625, grad_fn=<MseLossBackward>)
output :  tensor([[179882.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(13787.8965, grad_fn=<MseLossBackward>)
output :  tensor([[221825.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3332906.7500, grad_fn=<MseLossBackward>)
output :  tensor([[109754.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(3437808.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136852.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4286e+08, grad_fn=<MseLossBackward>)
output :  tensor([[288308.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5327441., grad_fn=<MseLossBackward>)
output :  tensor([[118727.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7441558., grad_fn=<MseLossBackward>)
output :  tensor([[176491.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8930e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182752.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(5053434., grad_fn=<MseLossBackward>)
output :  tensor([[180546.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(24534686., grad_fn=<MseLossBackward>)
output :  tensor([[249339.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5844e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222244.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(59658.0625, grad_fn=<MseLossBackward>)
output :  tensor([[123129.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9686e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173942.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3860e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124604.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(364957.5625, grad_fn=<MseLossBackward>)
output :  tensor([[183787.]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5021e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150962.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4151852., grad_fn=<MseLossBackward>)
output :  tensor([[155068.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(73424816., grad_fn=<MseLossBackward>)
output :  tensor([[201022.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(27851016., grad_fn=<MseLossBackward>)
output :  tensor([[145424.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6704e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175090.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(826479.8750, grad_fn=<MseLossBackward>)
output :  tensor([[250891.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1847e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149822.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3321278.5000, grad_fn=<MseLossBackward>)
output :  tensor([[205104.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5951922.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164218.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(18216224., grad_fn=<MseLossBackward>)
output :  tensor([[120797.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0757e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135490.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(67105.2812, grad_fn=<MseLossBackward>)
output :  tensor([[178610.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(29043006., grad_fn=<MseLossBackward>)
output :  tensor([[198290.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(68736016., grad_fn=<MseLossBackward>)
output :  tensor([[232816.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1566e+09, grad_fn=<MseLossBackward>)
output :  tensor([[256343.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(430623.0625, grad_fn=<MseLossBackward>)
output :  tensor([[188616.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7000e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141689.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5189e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145684.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1403595.5000, grad_fn=<MseLossBackward>)
output :  tensor([[69931.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9588e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138676.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(13516652., grad_fn=<MseLossBackward>)
output :  tensor([[127723.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(1383582.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157767.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(14195587., grad_fn=<MseLossBackward>)
output :  tensor([[129688.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(7226100., grad_fn=<MseLossBackward>)
output :  tensor([[79252.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(7577675.5000, grad_fn=<MseLossBackward>)
output :  tensor([[83949.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(3799849.7500, grad_fn=<MseLossBackward>)
output :  tensor([[227700.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(18484222., grad_fn=<MseLossBackward>)
output :  tensor([[141417.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3621e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129500.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(998453.7500, grad_fn=<MseLossBackward>)
output :  tensor([[166557.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(196165.9531, grad_fn=<MseLossBackward>)
output :  tensor([[232987.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4049653.2500, grad_fn=<MseLossBackward>)
output :  tensor([[189479.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7077013., grad_fn=<MseLossBackward>)
output :  tensor([[155798.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(40709.3672, grad_fn=<MseLossBackward>)
output :  tensor([[196932.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(936812.2500, grad_fn=<MseLossBackward>)
output :  tensor([[203948.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0924e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139068.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4278951., grad_fn=<MseLossBackward>)
output :  tensor([[153782.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1482458.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136224.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(50246.0234, grad_fn=<MseLossBackward>)
output :  tensor([[199943.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0340e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152746.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1570792.2500, grad_fn=<MseLossBackward>)
output :  tensor([[135561.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7691e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143700.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1438200.5000, grad_fn=<MseLossBackward>)
output :  tensor([[209570.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5904216.5000, grad_fn=<MseLossBackward>)
output :  tensor([[99879.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1966e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163045.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(19845216., grad_fn=<MseLossBackward>)
output :  tensor([[131614.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(13063368., grad_fn=<MseLossBackward>)
output :  tensor([[144962.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4150324., grad_fn=<MseLossBackward>)
output :  tensor([[102023.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5714e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138273.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(597963.8750, grad_fn=<MseLossBackward>)
output :  tensor([[235171.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(687085.5625, grad_fn=<MseLossBackward>)
output :  tensor([[144627.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(138686.4219, grad_fn=<MseLossBackward>)
output :  tensor([[138538.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1079228.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164713.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3479e+09, grad_fn=<MseLossBackward>)
output :  tensor([[274761.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(10487073., grad_fn=<MseLossBackward>)
output :  tensor([[177453.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(6020429., grad_fn=<MseLossBackward>)
output :  tensor([[102011.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(585045.6875, grad_fn=<MseLossBackward>)
output :  tensor([[204128.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3833e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159557.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(311154.7812, grad_fn=<MseLossBackward>)
output :  tensor([[163270.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5862e+10, grad_fn=<MseLossBackward>)
output :  tensor([[99323.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(1047600.2500, grad_fn=<MseLossBackward>)
output :  tensor([[125949.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5521325., grad_fn=<MseLossBackward>)
output :  tensor([[162492.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(42147280., grad_fn=<MseLossBackward>)
output :  tensor([[142019.]], grad_fn=<AddmmBackward>)
loss:  tensor(4076361., grad_fn=<MseLossBackward>)
output :  tensor([[198904.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1200359.8750, grad_fn=<MseLossBackward>)
output :  tensor([[145347.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(11203978., grad_fn=<MseLossBackward>)
output :  tensor([[261575.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(496386.3125, grad_fn=<MseLossBackward>)
output :  tensor([[128157.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2360e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164862.]], grad_fn=<AddmmBackward>)
loss:  tensor(407044., grad_fn=<MseLossBackward>)
output :  tensor([[189740.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1539848.3750, grad_fn=<MseLossBackward>)
output :  tensor([[125402.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3722e+08, grad_fn=<MseLossBackward>)
output :  tensor([[257878.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(62071748., grad_fn=<MseLossBackward>)
output :  tensor([[158843.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9281e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244375.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(950107.1250, grad_fn=<MseLossBackward>)
output :  tensor([[142911.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1185784.8750, grad_fn=<MseLossBackward>)
output :  tensor([[211530.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2343769.7500, grad_fn=<MseLossBackward>)
output :  tensor([[175825.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(11734478., grad_fn=<MseLossBackward>)
output :  tensor([[153757.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(58828.9883, grad_fn=<MseLossBackward>)
output :  tensor([[119931.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3729485.2500, grad_fn=<MseLossBackward>)
output :  tensor([[239476.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2670e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239876.]], grad_fn=<AddmmBackward>)
loss:  tensor(15376., grad_fn=<MseLossBackward>)
output :  tensor([[150659.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7170512.5000, grad_fn=<MseLossBackward>)
output :  tensor([[255302.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(162346.0312, grad_fn=<MseLossBackward>)
output :  tensor([[124144.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(92941048., grad_fn=<MseLossBackward>)
output :  tensor([[175461.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(289595.3438, grad_fn=<MseLossBackward>)
output :  tensor([[158493.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2270719.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132952.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3811280., grad_fn=<MseLossBackward>)
output :  tensor([[194472.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2214e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163433.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(321170.1562, grad_fn=<MseLossBackward>)
output :  tensor([[166940.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(15526555., grad_fn=<MseLossBackward>)
output :  tensor([[157934.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4308.6914, grad_fn=<MseLossBackward>)
output :  tensor([[142553.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(53975196., grad_fn=<MseLossBackward>)
output :  tensor([[171192.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8060e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158917.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1171704.7500, grad_fn=<MseLossBackward>)
output :  tensor([[381564.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5785528., grad_fn=<MseLossBackward>)
output :  tensor([[122463.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(20583448., grad_fn=<MseLossBackward>)
output :  tensor([[131006.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0708e+09, grad_fn=<MseLossBackward>)
output :  tensor([[276558.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(21668734., grad_fn=<MseLossBackward>)
output :  tensor([[161606.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(155162.1406, grad_fn=<MseLossBackward>)
output :  tensor([[131129.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1298e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226872.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(26289014., grad_fn=<MseLossBackward>)
output :  tensor([[181276.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(602782.3750, grad_fn=<MseLossBackward>)
output :  tensor([[153578.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2491070.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144629.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(137015.6562, grad_fn=<MseLossBackward>)
output :  tensor([[155275.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3766e+08, grad_fn=<MseLossBackward>)
output :  tensor([[101643.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2701708.5000, grad_fn=<MseLossBackward>)
output :  tensor([[73745.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8894e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164922.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(6064.5156, grad_fn=<MseLossBackward>)
output :  tensor([[188502.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5601e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160020.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4080652.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161069.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(12744565., grad_fn=<MseLossBackward>)
output :  tensor([[138263.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(662468.8125, grad_fn=<MseLossBackward>)
output :  tensor([[210305.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(18967658., grad_fn=<MseLossBackward>)
output :  tensor([[140354.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5542199., grad_fn=<MseLossBackward>)
output :  tensor([[183526.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5995e+10, grad_fn=<MseLossBackward>)
output :  tensor([[148807.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7883986.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109664.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1097e+08, grad_fn=<MseLossBackward>)
output :  tensor([[95725.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2976325.7500, grad_fn=<MseLossBackward>)
output :  tensor([[176515.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2296361.5000, grad_fn=<MseLossBackward>)
output :  tensor([[258399.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4001375., grad_fn=<MseLossBackward>)
output :  tensor([[139916.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2507274.2500, grad_fn=<MseLossBackward>)
output :  tensor([[157745.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4621156.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133612.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1237204.3750, grad_fn=<MseLossBackward>)
output :  tensor([[148763.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(542777.5625, grad_fn=<MseLossBackward>)
output :  tensor([[167440.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(211513.7656, grad_fn=<MseLossBackward>)
output :  tensor([[128416.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(2007601.1250, grad_fn=<MseLossBackward>)
output :  tensor([[170922.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7195e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160339.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(11149338., grad_fn=<MseLossBackward>)
output :  tensor([[122469.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(35638568., grad_fn=<MseLossBackward>)
output :  tensor([[158988.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4777e+09, grad_fn=<MseLossBackward>)
output :  tensor([[53229.2539]], grad_fn=<AddmmBackward>)
loss:  tensor(1511065.1250, grad_fn=<MseLossBackward>)
output :  tensor([[234294.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1161e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200172.]], grad_fn=<AddmmBackward>)
loss:  tensor(685584., grad_fn=<MseLossBackward>)
output :  tensor([[185661.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(437913.0625, grad_fn=<MseLossBackward>)
output :  tensor([[106638.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(407053.9688, grad_fn=<MseLossBackward>)
output :  tensor([[88076.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1158011.3750, grad_fn=<MseLossBackward>)
output :  tensor([[144541.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(20625790., grad_fn=<MseLossBackward>)
output :  tensor([[223269.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0029e+09, grad_fn=<MseLossBackward>)
output :  tensor([[206853.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(418386.6250, grad_fn=<MseLossBackward>)
output :  tensor([[170968.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(35619448., grad_fn=<MseLossBackward>)
output :  tensor([[175860.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9459e+09, grad_fn=<MseLossBackward>)
output :  tensor([[188906.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1195434.7500, grad_fn=<MseLossBackward>)
output :  tensor([[88646.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2711116.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140826.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(683360.5625, grad_fn=<MseLossBackward>)
output :  tensor([[114579.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(16645125., grad_fn=<MseLossBackward>)
output :  tensor([[149480.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8279e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172962.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7609e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195932.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(82214736., grad_fn=<MseLossBackward>)
output :  tensor([[177265.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(7478174., grad_fn=<MseLossBackward>)
output :  tensor([[96353.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(21320.5625, grad_fn=<MseLossBackward>)
output :  tensor([[119873.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5632612., grad_fn=<MseLossBackward>)
output :  tensor([[162442.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6471e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198568.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2049326.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144729.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(532101.8750, grad_fn=<MseLossBackward>)
train_loss: [2.5619325e+09]
epoch_result tensor([0.])
output :  tensor([[158656.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(24639.1875, grad_fn=<MseLossBackward>)
output :  tensor([[123053.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1108973.5000, grad_fn=<MseLossBackward>)
output :  tensor([[196231.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4121534.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176890.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(11952.6387, grad_fn=<MseLossBackward>)
output :  tensor([[152504.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5004e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128769.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(591445.1250, grad_fn=<MseLossBackward>)
output :  tensor([[142189.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1415430.7500, grad_fn=<MseLossBackward>)
output :  tensor([[119761.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(579251.8125, grad_fn=<MseLossBackward>)
output :  tensor([[65821.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(53604020., grad_fn=<MseLossBackward>)
output :  tensor([[165894.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(11123.6572, grad_fn=<MseLossBackward>)
output :  tensor([[141530.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2341617.2500, grad_fn=<MseLossBackward>)
output :  tensor([[225197.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(39098.8828, grad_fn=<MseLossBackward>)
output :  tensor([[169473.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(224261.4375, grad_fn=<MseLossBackward>)
output :  tensor([[246476.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(10392766., grad_fn=<MseLossBackward>)
output :  tensor([[55010.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(102.1995, grad_fn=<MseLossBackward>)
output :  tensor([[161358.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8420e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185005.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0011e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162834.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(40131632., grad_fn=<MseLossBackward>)
output :  tensor([[274698.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(90902.2500, grad_fn=<MseLossBackward>)
output :  tensor([[193569.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(11768437., grad_fn=<MseLossBackward>)
output :  tensor([[139305.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4635e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196779.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8410725., grad_fn=<MseLossBackward>)
output :  tensor([[180786.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9460e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151734.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(540018.3125, grad_fn=<MseLossBackward>)
output :  tensor([[168006.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3973419.2500, grad_fn=<MseLossBackward>)
output :  tensor([[86464.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(1132877.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171640.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4387e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181577.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(11713399., grad_fn=<MseLossBackward>)
output :  tensor([[207682.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2865e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113444.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(11865388., grad_fn=<MseLossBackward>)
output :  tensor([[171457.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(208948.9844, grad_fn=<MseLossBackward>)
output :  tensor([[135891.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(369778., grad_fn=<MseLossBackward>)
output :  tensor([[129252.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(63665.5391, grad_fn=<MseLossBackward>)
output :  tensor([[119309.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(36439.2305, grad_fn=<MseLossBackward>)
output :  tensor([[147136.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0818e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166861.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1945e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152699.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8995501., grad_fn=<MseLossBackward>)
output :  tensor([[183015.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(9094088., grad_fn=<MseLossBackward>)
output :  tensor([[140736.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(69506.3828, grad_fn=<MseLossBackward>)
output :  tensor([[104760.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1787e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135906.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2558e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138250.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(10566563., grad_fn=<MseLossBackward>)
output :  tensor([[134370.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(54320356., grad_fn=<MseLossBackward>)
output :  tensor([[224867.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(17452.8867, grad_fn=<MseLossBackward>)
output :  tensor([[133012.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(581763.7500, grad_fn=<MseLossBackward>)
output :  tensor([[146933.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4271262., grad_fn=<MseLossBackward>)
output :  tensor([[113474.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2175072., grad_fn=<MseLossBackward>)
output :  tensor([[161238.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1533843.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145687.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4317e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192576.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(332172.1250, grad_fn=<MseLossBackward>)
output :  tensor([[135078.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(395090.8125, grad_fn=<MseLossBackward>)
output :  tensor([[105473.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(20485666., grad_fn=<MseLossBackward>)
output :  tensor([[233808.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(36774.0547, grad_fn=<MseLossBackward>)
output :  tensor([[167016.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1598e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158915.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(7129.6914, grad_fn=<MseLossBackward>)
output :  tensor([[202832.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8787e+10, grad_fn=<MseLossBackward>)
output :  tensor([[249178.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0987e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145060.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2434575., grad_fn=<MseLossBackward>)
output :  tensor([[136700.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(7290422., grad_fn=<MseLossBackward>)
output :  tensor([[150526.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(20009126., grad_fn=<MseLossBackward>)
output :  tensor([[133733.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(13937156., grad_fn=<MseLossBackward>)
output :  tensor([[179922.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4124e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181597.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6264852.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171004.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(90338488., grad_fn=<MseLossBackward>)
output :  tensor([[135226.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(60421228., grad_fn=<MseLossBackward>)
output :  tensor([[141786.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(508970.7812, grad_fn=<MseLossBackward>)
output :  tensor([[149175.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(17431538., grad_fn=<MseLossBackward>)
output :  tensor([[174485.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2511e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194931.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8701e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136351.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(21987.3281, grad_fn=<MseLossBackward>)
output :  tensor([[171577.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(103834.9922, grad_fn=<MseLossBackward>)
output :  tensor([[175916.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(25842290., grad_fn=<MseLossBackward>)
output :  tensor([[119244.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(18014918., grad_fn=<MseLossBackward>)
output :  tensor([[220284.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(511292.0312, grad_fn=<MseLossBackward>)
output :  tensor([[183318.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(33089.8828, grad_fn=<MseLossBackward>)
output :  tensor([[124477.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(1044819.3750, grad_fn=<MseLossBackward>)
output :  tensor([[198359.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3456752.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175215.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(99727.6641, grad_fn=<MseLossBackward>)
output :  tensor([[209182.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1353e+10, grad_fn=<MseLossBackward>)
output :  tensor([[212136.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1292413.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164727.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1376e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193880.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(384012.5938, grad_fn=<MseLossBackward>)
output :  tensor([[114587.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2519213.7500, grad_fn=<MseLossBackward>)
output :  tensor([[114660.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(4668536.5000, grad_fn=<MseLossBackward>)
output :  tensor([[113436.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2064744.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147096.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(87977.1250, grad_fn=<MseLossBackward>)
output :  tensor([[159288.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3619e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179349.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(423719.6250, grad_fn=<MseLossBackward>)
output :  tensor([[127031.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(219917.0312, grad_fn=<MseLossBackward>)
output :  tensor([[144726.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(74776.6094, grad_fn=<MseLossBackward>)
output :  tensor([[186551.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6679e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118982.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4337977.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198740.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3027872., grad_fn=<MseLossBackward>)
output :  tensor([[146168.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1366268.7500, grad_fn=<MseLossBackward>)
output :  tensor([[211306.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2538395.7500, grad_fn=<MseLossBackward>)
output :  tensor([[124406.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(2538072.2500, grad_fn=<MseLossBackward>)
output :  tensor([[246816.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2285955., grad_fn=<MseLossBackward>)
output :  tensor([[240340.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9944e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148809.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0309e+08, grad_fn=<MseLossBackward>)
output :  tensor([[83652.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1314e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196120.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2063e+09, grad_fn=<MseLossBackward>)
output :  tensor([[83497.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(6239262.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139611.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(12362.6602, grad_fn=<MseLossBackward>)
output :  tensor([[75667.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(27917.7109, grad_fn=<MseLossBackward>)
output :  tensor([[143768.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(665091.2500, grad_fn=<MseLossBackward>)
output :  tensor([[178029.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4119694.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153806.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(93693.3828, grad_fn=<MseLossBackward>)
output :  tensor([[105133.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5136810., grad_fn=<MseLossBackward>)
output :  tensor([[206999.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1827e+10, grad_fn=<MseLossBackward>)
output :  tensor([[129168.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(447435.5625, grad_fn=<MseLossBackward>)
output :  tensor([[267854.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4751e+08, grad_fn=<MseLossBackward>)
output :  tensor([[302793.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(51934992., grad_fn=<MseLossBackward>)
output :  tensor([[112708.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(27125218., grad_fn=<MseLossBackward>)
output :  tensor([[168692.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(14500150., grad_fn=<MseLossBackward>)
output :  tensor([[132850.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1756e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138368.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(398851.4688, grad_fn=<MseLossBackward>)
output :  tensor([[127232.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(9103232., grad_fn=<MseLossBackward>)
output :  tensor([[126856.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3448217., grad_fn=<MseLossBackward>)
output :  tensor([[134010.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0078e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225644.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8949e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191202.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2439e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144613.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(509305.2500, grad_fn=<MseLossBackward>)
output :  tensor([[131013.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(12346329., grad_fn=<MseLossBackward>)
output :  tensor([[112569.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(1741224.6250, grad_fn=<MseLossBackward>)
output :  tensor([[258164.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5876e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133922.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1161410.3750, grad_fn=<MseLossBackward>)
output :  tensor([[199508.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(12192536., grad_fn=<MseLossBackward>)
output :  tensor([[105329.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(184141.5625, grad_fn=<MseLossBackward>)
output :  tensor([[141178.]], grad_fn=<AddmmBackward>)
loss:  tensor(1507984., grad_fn=<MseLossBackward>)
output :  tensor([[208885.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4380e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178523.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1895225.5000, grad_fn=<MseLossBackward>)
output :  tensor([[185112.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(12589.5410, grad_fn=<MseLossBackward>)
output :  tensor([[163603.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1140e+10, grad_fn=<MseLossBackward>)
output :  tensor([[302338.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0668e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197945.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2068.8284, grad_fn=<MseLossBackward>)
output :  tensor([[262451.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9715e+10, grad_fn=<MseLossBackward>)
output :  tensor([[223619.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7961e+09, grad_fn=<MseLossBackward>)
output :  tensor([[287591.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6487e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220961.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(9234476., grad_fn=<MseLossBackward>)
output :  tensor([[222176.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8840e+10, grad_fn=<MseLossBackward>)
output :  tensor([[198020.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1040814.4375, grad_fn=<MseLossBackward>)
output :  tensor([[158033.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4295e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134850.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5523528., grad_fn=<MseLossBackward>)
output :  tensor([[133671.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3343755., grad_fn=<MseLossBackward>)
output :  tensor([[90551.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(200907.0469, grad_fn=<MseLossBackward>)
output :  tensor([[108826.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(683644.7500, grad_fn=<MseLossBackward>)
output :  tensor([[275544.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8468e+09, grad_fn=<MseLossBackward>)
output :  tensor([[235114.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(13035.2168, grad_fn=<MseLossBackward>)
output :  tensor([[146596.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2547864.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134460.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(9236756., grad_fn=<MseLossBackward>)
output :  tensor([[172439.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1672536., grad_fn=<MseLossBackward>)
output :  tensor([[149032.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(14307661., grad_fn=<MseLossBackward>)
output :  tensor([[163990.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3082e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167132.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4546690., grad_fn=<MseLossBackward>)
output :  tensor([[136242.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(574350.8125, grad_fn=<MseLossBackward>)
output :  tensor([[187964.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2855e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110527.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(2167543., grad_fn=<MseLossBackward>)
output :  tensor([[166684.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(28252214., grad_fn=<MseLossBackward>)
output :  tensor([[119680.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(101980.4297, grad_fn=<MseLossBackward>)
output :  tensor([[83364.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(13217996., grad_fn=<MseLossBackward>)
output :  tensor([[178399.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2561550.2500, grad_fn=<MseLossBackward>)
output :  tensor([[110550.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(422530.4688, grad_fn=<MseLossBackward>)
output :  tensor([[238146.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(728008.8750, grad_fn=<MseLossBackward>)
output :  tensor([[244904.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(9051.7383, grad_fn=<MseLossBackward>)
output :  tensor([[135027.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(30547902., grad_fn=<MseLossBackward>)
output :  tensor([[112659.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(13690636., grad_fn=<MseLossBackward>)
output :  tensor([[287598.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2367e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174550.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(9302595., grad_fn=<MseLossBackward>)
output :  tensor([[123902.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(1203803.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142734.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1181e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203251.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1553e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139954.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1093887.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158139.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4850e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157049.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(9916890., grad_fn=<MseLossBackward>)
output :  tensor([[131016.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(2300222.5000, grad_fn=<MseLossBackward>)
output :  tensor([[249863.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6547e+10, grad_fn=<MseLossBackward>)
output :  tensor([[401752.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(61148.0156, grad_fn=<MseLossBackward>)
output :  tensor([[110815.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(3297090., grad_fn=<MseLossBackward>)
output :  tensor([[114922.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(12795767., grad_fn=<MseLossBackward>)
output :  tensor([[156611.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(8344696., grad_fn=<MseLossBackward>)
output :  tensor([[129603.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9517e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162405.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5515e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172393.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8930e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107545.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(15567710., grad_fn=<MseLossBackward>)
output :  tensor([[141142.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(20199.5156, grad_fn=<MseLossBackward>)
output :  tensor([[363601.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(13636403., grad_fn=<MseLossBackward>)
output :  tensor([[206069.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2974e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175075.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(180107.4062, grad_fn=<MseLossBackward>)
output :  tensor([[201443.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2122393.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142975.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(15803855., grad_fn=<MseLossBackward>)
output :  tensor([[196641.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4586490.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134195.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1267e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179111.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3565665., grad_fn=<MseLossBackward>)
output :  tensor([[240573.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2033877.1250, grad_fn=<MseLossBackward>)
output :  tensor([[175623.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2634839., grad_fn=<MseLossBackward>)
output :  tensor([[110671.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(7134408., grad_fn=<MseLossBackward>)
output :  tensor([[264690.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(16778.3438, grad_fn=<MseLossBackward>)
output :  tensor([[262598.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5872e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122908.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(8316.5850, grad_fn=<MseLossBackward>)
output :  tensor([[215720.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5140e+09, grad_fn=<MseLossBackward>)
output :  tensor([[304796.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2039e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208077.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1160905.2500, grad_fn=<MseLossBackward>)
output :  tensor([[216722.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5197e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160289.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5708590., grad_fn=<MseLossBackward>)
output :  tensor([[169836.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(23658.2852, grad_fn=<MseLossBackward>)
output :  tensor([[159963.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(9189898., grad_fn=<MseLossBackward>)
output :  tensor([[173371.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(11366169., grad_fn=<MseLossBackward>)
output :  tensor([[237897.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0618e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223344.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(37345276., grad_fn=<MseLossBackward>)
output :  tensor([[159030.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4474e+08, grad_fn=<MseLossBackward>)
output :  tensor([[119024.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(15806526., grad_fn=<MseLossBackward>)
output :  tensor([[176841.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(25092.5391, grad_fn=<MseLossBackward>)
output :  tensor([[179518.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4772e+09, grad_fn=<MseLossBackward>)
output :  tensor([[208160.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4766e+10, grad_fn=<MseLossBackward>)
output :  tensor([[137650.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(10356530., grad_fn=<MseLossBackward>)
output :  tensor([[153603.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0242e+09, grad_fn=<MseLossBackward>)
output :  tensor([[276351.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(421079.3125, grad_fn=<MseLossBackward>)
output :  tensor([[86545.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2389101.5000, grad_fn=<MseLossBackward>)
output :  tensor([[233803.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7269595.5000, grad_fn=<MseLossBackward>)
output :  tensor([[261435.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0336e+11, grad_fn=<MseLossBackward>)
output :  tensor([[174340.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(18842110., grad_fn=<MseLossBackward>)
output :  tensor([[195922.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5270e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153712.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1658139.1250, grad_fn=<MseLossBackward>)
output :  tensor([[207728.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8778e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129049.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2481.2852, grad_fn=<MseLossBackward>)
output :  tensor([[147295.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5269105., grad_fn=<MseLossBackward>)
output :  tensor([[167219.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1105e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185022.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(684161.6250, grad_fn=<MseLossBackward>)
output :  tensor([[129507.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(12303872., grad_fn=<MseLossBackward>)
output :  tensor([[136057.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(195529.7812, grad_fn=<MseLossBackward>)
output :  tensor([[171869.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1279055., grad_fn=<MseLossBackward>)
output :  tensor([[197240.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7836e+09, grad_fn=<MseLossBackward>)
output :  tensor([[244503.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2261123., grad_fn=<MseLossBackward>)
output :  tensor([[155037.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1440.4397, grad_fn=<MseLossBackward>)
output :  tensor([[194784.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1476832.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161451.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0456e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180485.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(970779.1250, grad_fn=<MseLossBackward>)
output :  tensor([[174225.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(32205092., grad_fn=<MseLossBackward>)
output :  tensor([[95323.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2811647.7500, grad_fn=<MseLossBackward>)
output :  tensor([[171949.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1675e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134558.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(194991.2344, grad_fn=<MseLossBackward>)
output :  tensor([[119265.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(18194024., grad_fn=<MseLossBackward>)
output :  tensor([[173004.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(990367.0625, grad_fn=<MseLossBackward>)
output :  tensor([[86687.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(2848790.2500, grad_fn=<MseLossBackward>)
output :  tensor([[286759.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(10499220., grad_fn=<MseLossBackward>)
output :  tensor([[166936.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3749790.2500, grad_fn=<MseLossBackward>)
output :  tensor([[193985.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9372e+10, grad_fn=<MseLossBackward>)
output :  tensor([[247945.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3149e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150125.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(764777.5625, grad_fn=<MseLossBackward>)
output :  tensor([[122589.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1989598.3750, grad_fn=<MseLossBackward>)
output :  tensor([[116394.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(12286175., grad_fn=<MseLossBackward>)
output :  tensor([[145092.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0558e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176040.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4164214.2500, grad_fn=<MseLossBackward>)
output :  tensor([[110663.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9316e+08, grad_fn=<MseLossBackward>)
output :  tensor([[216148.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0374e+10, grad_fn=<MseLossBackward>)
output :  tensor([[235895.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(31412872., grad_fn=<MseLossBackward>)
output :  tensor([[254475.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9801e+10, grad_fn=<MseLossBackward>)
output :  tensor([[223786.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3146e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197799.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3853e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189916.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5838339.5000, grad_fn=<MseLossBackward>)
output :  tensor([[206391.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7733e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191167.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0977e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177634.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1222199.3750, grad_fn=<MseLossBackward>)
output :  tensor([[152423.]], grad_fn=<AddmmBackward>)
loss:  tensor(178929., grad_fn=<MseLossBackward>)
output :  tensor([[335818.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1395351.5000, grad_fn=<MseLossBackward>)
output :  tensor([[210077.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3695405.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160002.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0947, grad_fn=<MseLossBackward>)
output :  tensor([[190536.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5972e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106785.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3189461.2500, grad_fn=<MseLossBackward>)
output :  tensor([[274406.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8733e+10, grad_fn=<MseLossBackward>)
output :  tensor([[172820.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1165320.2500, grad_fn=<MseLossBackward>)
output :  tensor([[214941.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2078958.5000, grad_fn=<MseLossBackward>)
output :  tensor([[213073.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(62833116., grad_fn=<MseLossBackward>)
output :  tensor([[178779.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(177096.3125, grad_fn=<MseLossBackward>)
output :  tensor([[200019.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3171682.7500, grad_fn=<MseLossBackward>)
output :  tensor([[157778.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7717371., grad_fn=<MseLossBackward>)
output :  tensor([[146130.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1280e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118475.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(604.0842, grad_fn=<MseLossBackward>)
output :  tensor([[140259.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(67129.5703, grad_fn=<MseLossBackward>)
output :  tensor([[147718.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1642442.5000, grad_fn=<MseLossBackward>)
output :  tensor([[201492.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6004e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160904.]], grad_fn=<AddmmBackward>)
loss:  tensor(1971216., grad_fn=<MseLossBackward>)
output :  tensor([[101690.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4796853., grad_fn=<MseLossBackward>)
output :  tensor([[223936.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5804e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183091.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0948e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175894.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(348911.7188, grad_fn=<MseLossBackward>)
output :  tensor([[85420.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(11696828., grad_fn=<MseLossBackward>)
output :  tensor([[128527.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(765.3004, grad_fn=<MseLossBackward>)
output :  tensor([[217792.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(14384597., grad_fn=<MseLossBackward>)
output :  tensor([[144043.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1875.9727, grad_fn=<MseLossBackward>)
output :  tensor([[134505.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(20297418., grad_fn=<MseLossBackward>)
output :  tensor([[144509.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3644698.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177090.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5674e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144543.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(295273.3750, grad_fn=<MseLossBackward>)
output :  tensor([[160148.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(21982.6953, grad_fn=<MseLossBackward>)
output :  tensor([[212505.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6221595., grad_fn=<MseLossBackward>)
output :  tensor([[136834.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0134e+09, grad_fn=<MseLossBackward>)
output :  tensor([[259467.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(19958556., grad_fn=<MseLossBackward>)
output :  tensor([[156927.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6616631., grad_fn=<MseLossBackward>)
output :  tensor([[128465.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(1224.4531, grad_fn=<MseLossBackward>)
output :  tensor([[92710.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(5243992.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155151.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9916e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179540.]], grad_fn=<AddmmBackward>)
loss:  tensor(129600., grad_fn=<MseLossBackward>)
output :  tensor([[121298.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(638026.5000, grad_fn=<MseLossBackward>)
output :  tensor([[188452.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6400e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144376.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2090e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151055.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1335324.7500, grad_fn=<MseLossBackward>)
output :  tensor([[186196.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2414624.7500, grad_fn=<MseLossBackward>)
output :  tensor([[253944.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5313e+09, grad_fn=<MseLossBackward>)
output :  tensor([[92203.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(495308.0625, grad_fn=<MseLossBackward>)
output :  tensor([[241038.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1078936.6250, grad_fn=<MseLossBackward>)
output :  tensor([[131277.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7713898.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165856.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0009e+10, grad_fn=<MseLossBackward>)
output :  tensor([[112614.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5913e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176691.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(477610.5625, grad_fn=<MseLossBackward>)
output :  tensor([[161755.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9977e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154838.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9238e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235001.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(15987502., grad_fn=<MseLossBackward>)
output :  tensor([[224697.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1090e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130515.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(12357092., grad_fn=<MseLossBackward>)
output :  tensor([[124045.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3821841.7500, grad_fn=<MseLossBackward>)
output :  tensor([[222303.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(22058434., grad_fn=<MseLossBackward>)
output :  tensor([[227755.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(38994560., grad_fn=<MseLossBackward>)
output :  tensor([[226312.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(149914.1562, grad_fn=<MseLossBackward>)
output :  tensor([[146930.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1143228.7500, grad_fn=<MseLossBackward>)
output :  tensor([[213857.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(14877654., grad_fn=<MseLossBackward>)
output :  tensor([[131089.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2298e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134832.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5438370., grad_fn=<MseLossBackward>)
output :  tensor([[311203.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(14416260., grad_fn=<MseLossBackward>)
output :  tensor([[138696.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5304169., grad_fn=<MseLossBackward>)
output :  tensor([[120697.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8835e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110382.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(779413.0625, grad_fn=<MseLossBackward>)
output :  tensor([[157362.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2915e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180493.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8796e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176690.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(13618637., grad_fn=<MseLossBackward>)
output :  tensor([[193188.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(61017092., grad_fn=<MseLossBackward>)
output :  tensor([[95249.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(22564430., grad_fn=<MseLossBackward>)
output :  tensor([[181710.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7347234., grad_fn=<MseLossBackward>)
output :  tensor([[174262.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(40479020., grad_fn=<MseLossBackward>)
output :  tensor([[137334.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2774879.2500, grad_fn=<MseLossBackward>)
output :  tensor([[264062.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0321e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141974.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2461e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172933.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4378.7168, grad_fn=<MseLossBackward>)
output :  tensor([[139773.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(51238.5664, grad_fn=<MseLossBackward>)
output :  tensor([[192186.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(69110128., grad_fn=<MseLossBackward>)
output :  tensor([[166299.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(13690347., grad_fn=<MseLossBackward>)
output :  tensor([[242734.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1601371.6250, grad_fn=<MseLossBackward>)
output :  tensor([[132810.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2854621.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150418.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1141825.8750, grad_fn=<MseLossBackward>)
output :  tensor([[213444.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2420406.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161897.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(9627348., grad_fn=<MseLossBackward>)
output :  tensor([[186256.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7528421.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132657.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9392e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132485.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(12148819., grad_fn=<MseLossBackward>)
output :  tensor([[143580.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(12823225., grad_fn=<MseLossBackward>)
output :  tensor([[204566.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2164e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166585.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6611e+09, grad_fn=<MseLossBackward>)
output :  tensor([[74648.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1458e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93652.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(83769112., grad_fn=<MseLossBackward>)
output :  tensor([[252323.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(940445.3750, grad_fn=<MseLossBackward>)
output :  tensor([[206170.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5119e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111761.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(10490868., grad_fn=<MseLossBackward>)
output :  tensor([[159515.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8312e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207143.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6529e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182483.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6591e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159730.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(22382066., grad_fn=<MseLossBackward>)
output :  tensor([[170966.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(933608.8750, grad_fn=<MseLossBackward>)
output :  tensor([[114351.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(419995.1250, grad_fn=<MseLossBackward>)
output :  tensor([[160973.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(35681024., grad_fn=<MseLossBackward>)
output :  tensor([[192521.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0674e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220778.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1635201.5000, grad_fn=<MseLossBackward>)
output :  tensor([[248405.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4661e+11, grad_fn=<MseLossBackward>)
output :  tensor([[146148.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(725078.8750, grad_fn=<MseLossBackward>)
output :  tensor([[108679.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(39825.1914, grad_fn=<MseLossBackward>)
output :  tensor([[170355.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3328e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152524.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4098094.2500, grad_fn=<MseLossBackward>)
output :  tensor([[234080.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8520926., grad_fn=<MseLossBackward>)
output :  tensor([[117727.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7441131.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186736.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(14719811., grad_fn=<MseLossBackward>)
output :  tensor([[187922.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1494544.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164325.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4234e+10, grad_fn=<MseLossBackward>)
output :  tensor([[92427.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3059e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237584.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2004348., grad_fn=<MseLossBackward>)
output :  tensor([[178052.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4211730., grad_fn=<MseLossBackward>)
output :  tensor([[141369.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1875273.5000, grad_fn=<MseLossBackward>)
output :  tensor([[235582.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(339215.2500, grad_fn=<MseLossBackward>)
output :  tensor([[165935.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(8619087., grad_fn=<MseLossBackward>)
output :  tensor([[207090.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3903e+10, grad_fn=<MseLossBackward>)
output :  tensor([[131353.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(13294683., grad_fn=<MseLossBackward>)
output :  tensor([[187513.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5096e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134462.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2364098.5000, grad_fn=<MseLossBackward>)
output :  tensor([[226097.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(98053008., grad_fn=<MseLossBackward>)
output :  tensor([[224307.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6012e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92922.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(8542650., grad_fn=<MseLossBackward>)
output :  tensor([[159360.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5422.9414, grad_fn=<MseLossBackward>)
output :  tensor([[247538.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5213e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147109.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4448013., grad_fn=<MseLossBackward>)
output :  tensor([[108476.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7203e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164870.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(137328.1406, grad_fn=<MseLossBackward>)
output :  tensor([[143602.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(157621.4062, grad_fn=<MseLossBackward>)
output :  tensor([[129029.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(688679.5625, grad_fn=<MseLossBackward>)
output :  tensor([[188996.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9005e+09, grad_fn=<MseLossBackward>)
output :  tensor([[125020.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(6351384.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150838.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1349953.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169940.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3272537.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150958.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1696.4102, grad_fn=<MseLossBackward>)
output :  tensor([[161563.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1787276.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135860.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2151e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130633.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1867706.6250, grad_fn=<MseLossBackward>)
output :  tensor([[156021.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8972e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145740.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2522885.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160005.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3041972., grad_fn=<MseLossBackward>)
output :  tensor([[134787.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1938e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150006.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1456396.3750, grad_fn=<MseLossBackward>)
output :  tensor([[186003.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3984577.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169476.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(226873.5938, grad_fn=<MseLossBackward>)
output :  tensor([[181477.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2181575.2500, grad_fn=<MseLossBackward>)
output :  tensor([[218629.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1878227.3750, grad_fn=<MseLossBackward>)
output :  tensor([[113225.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(28359952., grad_fn=<MseLossBackward>)
output :  tensor([[136184.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2735e+08, grad_fn=<MseLossBackward>)
output :  tensor([[283619.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5664995., grad_fn=<MseLossBackward>)
output :  tensor([[115040.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(920970.1250, grad_fn=<MseLossBackward>)
output :  tensor([[175552.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9756e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181791.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(10294272., grad_fn=<MseLossBackward>)
output :  tensor([[182905.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6731511.5000, grad_fn=<MseLossBackward>)
output :  tensor([[252200.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1982e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222107.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(11549.5322, grad_fn=<MseLossBackward>)
output :  tensor([[126795.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3662e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173337.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1360e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125041.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1084559.5000, grad_fn=<MseLossBackward>)
output :  tensor([[184797.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4507e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153651.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(424757.6875, grad_fn=<MseLossBackward>)
output :  tensor([[153671.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(51437136., grad_fn=<MseLossBackward>)
output :  tensor([[204364.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3745132., grad_fn=<MseLossBackward>)
output :  tensor([[144878.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5323e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176789.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(623162.2500, grad_fn=<MseLossBackward>)
output :  tensor([[252324.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3851e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145742.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5097294., grad_fn=<MseLossBackward>)
output :  tensor([[202062.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(363401.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161257.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1708780., grad_fn=<MseLossBackward>)
output :  tensor([[123133.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2343e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142035.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(39502404., grad_fn=<MseLossBackward>)
output :  tensor([[179953.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(16375300., grad_fn=<MseLossBackward>)
output :  tensor([[198537.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(72888376., grad_fn=<MseLossBackward>)
output :  tensor([[233186.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1152e+09, grad_fn=<MseLossBackward>)
output :  tensor([[255709.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1665390.2500, grad_fn=<MseLossBackward>)
output :  tensor([[189413.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6793e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144573.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8168e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143415.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1175564.1250, grad_fn=<MseLossBackward>)
output :  tensor([[71516.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9330e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130661.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(18820074., grad_fn=<MseLossBackward>)
output :  tensor([[130823.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3698590., grad_fn=<MseLossBackward>)
output :  tensor([[155830.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3349986.7500, grad_fn=<MseLossBackward>)
output :  tensor([[129058.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4237744., grad_fn=<MseLossBackward>)
output :  tensor([[75552.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(897208.5625, grad_fn=<MseLossBackward>)
output :  tensor([[81301.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(487782.1875, grad_fn=<MseLossBackward>)
output :  tensor([[241911.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(98242168., grad_fn=<MseLossBackward>)
output :  tensor([[139592.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3398e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138805.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(68974320., grad_fn=<MseLossBackward>)
output :  tensor([[170408.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(11616275., grad_fn=<MseLossBackward>)
output :  tensor([[238251.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(10572354., grad_fn=<MseLossBackward>)
output :  tensor([[190929.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1464364.7500, grad_fn=<MseLossBackward>)
output :  tensor([[156824.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(679413.8125, grad_fn=<MseLossBackward>)
output :  tensor([[199609.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2920894.7500, grad_fn=<MseLossBackward>)
output :  tensor([[205184.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0122e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134017.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(8893442., grad_fn=<MseLossBackward>)
output :  tensor([[154713.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(82315.1953, grad_fn=<MseLossBackward>)
output :  tensor([[134725.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1625186.7500, grad_fn=<MseLossBackward>)
output :  tensor([[201392.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1840e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156247.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5051045.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137123.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9030e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145448.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(300526.6562, grad_fn=<MseLossBackward>)
output :  tensor([[207676.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(18692246., grad_fn=<MseLossBackward>)
output :  tensor([[102029.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0119e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166470.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1059419.8750, grad_fn=<MseLossBackward>)
output :  tensor([[129465.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(2148766.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146002.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(995037.4375, grad_fn=<MseLossBackward>)
output :  tensor([[104245.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7525e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138257.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(573545.8750, grad_fn=<MseLossBackward>)
output :  tensor([[235245.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(569341., grad_fn=<MseLossBackward>)
output :  tensor([[146902.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3617841.7500, grad_fn=<MseLossBackward>)
output :  tensor([[138145.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(416811.4688, grad_fn=<MseLossBackward>)
output :  tensor([[163954.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2927e+09, grad_fn=<MseLossBackward>)
output :  tensor([[271473.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(42592348., grad_fn=<MseLossBackward>)
output :  tensor([[173483.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2300767.5000, grad_fn=<MseLossBackward>)
output :  tensor([[106074.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(10878762., grad_fn=<MseLossBackward>)
output :  tensor([[202159.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6761e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160185.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1405854.8750, grad_fn=<MseLossBackward>)
output :  tensor([[162682.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6115e+10, grad_fn=<MseLossBackward>)
output :  tensor([[99927.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(2647612., grad_fn=<MseLossBackward>)
output :  tensor([[123535.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4104.0039, grad_fn=<MseLossBackward>)
output :  tensor([[158656.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(7056577., grad_fn=<MseLossBackward>)
output :  tensor([[140884.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(781815.1875, grad_fn=<MseLossBackward>)
output :  tensor([[201191.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1419039.3750, grad_fn=<MseLossBackward>)
output :  tensor([[139226.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7690655.5000, grad_fn=<MseLossBackward>)
output :  tensor([[260860.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2014980.2500, grad_fn=<MseLossBackward>)
output :  tensor([[127192.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1691e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164702.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(635831.8125, grad_fn=<MseLossBackward>)
output :  tensor([[188839.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(115005.7656, grad_fn=<MseLossBackward>)
output :  tensor([[124510.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1055e+08, grad_fn=<MseLossBackward>)
output :  tensor([[255247.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(27533796., grad_fn=<MseLossBackward>)
output :  tensor([[158336.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2157e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244409.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(884481.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143277.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(521848.2188, grad_fn=<MseLossBackward>)
output :  tensor([[209683.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(99994.2969, grad_fn=<MseLossBackward>)
output :  tensor([[175592.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(10191757., grad_fn=<MseLossBackward>)
output :  tensor([[155749.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3060859.5000, grad_fn=<MseLossBackward>)
output :  tensor([[115553.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(5986318., grad_fn=<MseLossBackward>)
output :  tensor([[239873.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2294e+09, grad_fn=<MseLossBackward>)
output :  tensor([[240305.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(93110.8047, grad_fn=<MseLossBackward>)
output :  tensor([[152637.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(489584.4688, grad_fn=<MseLossBackward>)
output :  tensor([[253945.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(910593.0625, grad_fn=<MseLossBackward>)
output :  tensor([[125585.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2280e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178801.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7849978., grad_fn=<MseLossBackward>)
output :  tensor([[162141.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4586959., grad_fn=<MseLossBackward>)
output :  tensor([[134618.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(13092864., grad_fn=<MseLossBackward>)
output :  tensor([[192563.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9770e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165422.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2024884.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166613.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(13059528., grad_fn=<MseLossBackward>)
output :  tensor([[157245.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(569671.1250, grad_fn=<MseLossBackward>)
output :  tensor([[153519.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(13100780., grad_fn=<MseLossBackward>)
output :  tensor([[175004.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2909e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159363.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(404615.2500, grad_fn=<MseLossBackward>)
output :  tensor([[380428.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(12539345., grad_fn=<MseLossBackward>)
output :  tensor([[134086.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(50211616., grad_fn=<MseLossBackward>)
output :  tensor([[128546.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8530e+09, grad_fn=<MseLossBackward>)
output :  tensor([[279597.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2608931.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163847.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3412736.7500, grad_fn=<MseLossBackward>)
output :  tensor([[131972.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3161e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243267.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2697e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176738.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(14146414., grad_fn=<MseLossBackward>)
output :  tensor([[149758.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5022781.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143862.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1293479.7500, grad_fn=<MseLossBackward>)
output :  tensor([[154440.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0767e+08, grad_fn=<MseLossBackward>)
output :  tensor([[103018.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(9108607., grad_fn=<MseLossBackward>)
output :  tensor([[74252.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0315e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163254.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3047588.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191030.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3667e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161012.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(9076851., grad_fn=<MseLossBackward>)
output :  tensor([[155103.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5744261., grad_fn=<MseLossBackward>)
output :  tensor([[135118.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5435965., grad_fn=<MseLossBackward>)
output :  tensor([[204068.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3539454.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140727.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(7439341.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183135.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6095e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147833.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3361493., grad_fn=<MseLossBackward>)
output :  tensor([[108969.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7441e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92789.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(1465480.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175011.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(124.4619, grad_fn=<MseLossBackward>)
output :  tensor([[260813.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(170853.0625, grad_fn=<MseLossBackward>)
output :  tensor([[143280.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3169623.7500, grad_fn=<MseLossBackward>)
output :  tensor([[158359.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2356273., grad_fn=<MseLossBackward>)
output :  tensor([[133266.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(587666., grad_fn=<MseLossBackward>)
output :  tensor([[152472.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(8833341., grad_fn=<MseLossBackward>)
output :  tensor([[166613.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1656248.3750, grad_fn=<MseLossBackward>)
output :  tensor([[125796.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1449315., grad_fn=<MseLossBackward>)
output :  tensor([[172272.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4381e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156214.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(617476.7500, grad_fn=<MseLossBackward>)
output :  tensor([[117968.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2156675.7500, grad_fn=<MseLossBackward>)
output :  tensor([[162266.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0033e+09, grad_fn=<MseLossBackward>)
output :  tensor([[51384.0117]], grad_fn=<AddmmBackward>)
loss:  tensor(379441.5625, grad_fn=<MseLossBackward>)
output :  tensor([[233516.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2384e+09, grad_fn=<MseLossBackward>)
output :  tensor([[202515.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2295319.7500, grad_fn=<MseLossBackward>)
output :  tensor([[182825.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4728246.5000, grad_fn=<MseLossBackward>)
output :  tensor([[104814.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(1404317.6250, grad_fn=<MseLossBackward>)
output :  tensor([[91232.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(17914982., grad_fn=<MseLossBackward>)
output :  tensor([[129259.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1536e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222170.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1595e+09, grad_fn=<MseLossBackward>)
output :  tensor([[204783.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(7380136.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166913.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3662917.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175375.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0326e+09, grad_fn=<MseLossBackward>)
output :  tensor([[188854.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1313244.3750, grad_fn=<MseLossBackward>)
output :  tensor([[88718.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2954423.7500, grad_fn=<MseLossBackward>)
output :  tensor([[139325.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(455561.7188, grad_fn=<MseLossBackward>)
output :  tensor([[111876.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(1896064.5000, grad_fn=<MseLossBackward>)
output :  tensor([[148445.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5588e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172186.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6963e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196107.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(79081280., grad_fn=<MseLossBackward>)
output :  tensor([[180398.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(158677.7500, grad_fn=<MseLossBackward>)
output :  tensor([[99576.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(9466583., grad_fn=<MseLossBackward>)
output :  tensor([[118633.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1285530.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161013.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2838e+08, grad_fn=<MseLossBackward>)
output :  tensor([[200413.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(170607.7188, grad_fn=<MseLossBackward>)
output :  tensor([[140379.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(13108699., grad_fn=<MseLossBackward>)
train_loss: [2.563039e+09]
epoch_result tensor([0.])
output :  tensor([[157258.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1542525.2500, grad_fn=<MseLossBackward>)
output :  tensor([[122536.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(288075.4062, grad_fn=<MseLossBackward>)
output :  tensor([[196405.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4859544.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177359.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(129127.9297, grad_fn=<MseLossBackward>)
output :  tensor([[151116.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2272e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128335.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(112355.8984, grad_fn=<MseLossBackward>)
output :  tensor([[141026.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(700.5947, grad_fn=<MseLossBackward>)
output :  tensor([[119182.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(33431.8359, grad_fn=<MseLossBackward>)
output :  tensor([[66199.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(59277608., grad_fn=<MseLossBackward>)
output :  tensor([[165868.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(17374.5352, grad_fn=<MseLossBackward>)
output :  tensor([[138138.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3466055., grad_fn=<MseLossBackward>)
output :  tensor([[223701.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1685818.2500, grad_fn=<MseLossBackward>)
output :  tensor([[165846.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(9947026., grad_fn=<MseLossBackward>)
output :  tensor([[250579.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(773300.3750, grad_fn=<MseLossBackward>)
output :  tensor([[59092.3086]], grad_fn=<AddmmBackward>)
loss:  tensor(16746990., grad_fn=<MseLossBackward>)
output :  tensor([[160482.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5546e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171520.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(12105289., grad_fn=<MseLossBackward>)
output :  tensor([[146393.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0215e+08, grad_fn=<MseLossBackward>)
output :  tensor([[279445.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(19761914., grad_fn=<MseLossBackward>)
output :  tensor([[194981.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4074910., grad_fn=<MseLossBackward>)
output :  tensor([[139931.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4294e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196392.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(6318389., grad_fn=<MseLossBackward>)
output :  tensor([[177906.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2084e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151742.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(550842.3125, grad_fn=<MseLossBackward>)
output :  tensor([[171707.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2914062.5000, grad_fn=<MseLossBackward>)
output :  tensor([[87679.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5196262.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170033.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2528e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185723.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(523610.5312, grad_fn=<MseLossBackward>)
output :  tensor([[209004.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1619e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110668.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(446484.9688, grad_fn=<MseLossBackward>)
output :  tensor([[170438.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(315071.7188, grad_fn=<MseLossBackward>)
output :  tensor([[138684.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4771835.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128711.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(83074.5547, grad_fn=<MseLossBackward>)
output :  tensor([[121929.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5903457.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145660.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2140e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167952.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1623e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147633.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4271068., grad_fn=<MseLossBackward>)
output :  tensor([[180322.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(103955.8672, grad_fn=<MseLossBackward>)
output :  tensor([[143452.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6015829.5000, grad_fn=<MseLossBackward>)
output :  tensor([[107229.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9687e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134528.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4756e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133755.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1547847., grad_fn=<MseLossBackward>)
output :  tensor([[134359.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(54164080., grad_fn=<MseLossBackward>)
output :  tensor([[223236.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3109656.7500, grad_fn=<MseLossBackward>)
output :  tensor([[130369.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(3537426.2500, grad_fn=<MseLossBackward>)
output :  tensor([[150227.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1507677., grad_fn=<MseLossBackward>)
output :  tensor([[112614.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(377811.9062, grad_fn=<MseLossBackward>)
output :  tensor([[163207.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(10288658., grad_fn=<MseLossBackward>)
output :  tensor([[146978.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3060e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192946.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(896098.8750, grad_fn=<MseLossBackward>)
output :  tensor([[135993.]], grad_fn=<AddmmBackward>)
loss:  tensor(2380849., grad_fn=<MseLossBackward>)
output :  tensor([[115694.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(32429644., grad_fn=<MseLossBackward>)
output :  tensor([[231877.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4503812.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167060.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1557e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164073.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(25740244., grad_fn=<MseLossBackward>)
output :  tensor([[204362.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8270e+10, grad_fn=<MseLossBackward>)
output :  tensor([[247956.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1245e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143318.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(32783.6289, grad_fn=<MseLossBackward>)
output :  tensor([[137006.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(9040733., grad_fn=<MseLossBackward>)
output :  tensor([[153616.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1912948.3750, grad_fn=<MseLossBackward>)
output :  tensor([[135930.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(35174536., grad_fn=<MseLossBackward>)
output :  tensor([[179144.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5376e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183182.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(842179., grad_fn=<MseLossBackward>)
output :  tensor([[164221.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7403926., grad_fn=<MseLossBackward>)
output :  tensor([[147791.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(22961766., grad_fn=<MseLossBackward>)
output :  tensor([[144919.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(5855568., grad_fn=<MseLossBackward>)
output :  tensor([[141924.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9458412., grad_fn=<MseLossBackward>)
output :  tensor([[172437.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5223e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195576.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5897e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140418.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(15357091., grad_fn=<MseLossBackward>)
output :  tensor([[176515.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(21298370., grad_fn=<MseLossBackward>)
output :  tensor([[181503.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(253590.9219, grad_fn=<MseLossBackward>)
output :  tensor([[118418.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(11683311., grad_fn=<MseLossBackward>)
output :  tensor([[221229.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(52706.1172, grad_fn=<MseLossBackward>)
output :  tensor([[188246.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(22527186., grad_fn=<MseLossBackward>)
output :  tensor([[127193.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2869106.7500, grad_fn=<MseLossBackward>)
output :  tensor([[195123.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1895139.3750, grad_fn=<MseLossBackward>)
output :  tensor([[172009.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8354448.5000, grad_fn=<MseLossBackward>)
output :  tensor([[214852.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9377e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209031.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3875792., grad_fn=<MseLossBackward>)
output :  tensor([[164597.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1288e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194800.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(90262.6875, grad_fn=<MseLossBackward>)
output :  tensor([[112277.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(522209.4688, grad_fn=<MseLossBackward>)
output :  tensor([[115443.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(8663732., grad_fn=<MseLossBackward>)
output :  tensor([[108968.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(9187340., grad_fn=<MseLossBackward>)
output :  tensor([[147794.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(988284.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160106.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3320e+10, grad_fn=<MseLossBackward>)
output :  tensor([[181521.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2314059., grad_fn=<MseLossBackward>)
output :  tensor([[130531.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(9191271., grad_fn=<MseLossBackward>)
output :  tensor([[148022.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(9138151., grad_fn=<MseLossBackward>)
output :  tensor([[181136.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1378e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116728.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(29541.0156, grad_fn=<MseLossBackward>)
output :  tensor([[198018.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1037087.6250, grad_fn=<MseLossBackward>)
output :  tensor([[147636.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6950720.5000, grad_fn=<MseLossBackward>)
output :  tensor([[211573.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1760348.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129004.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(9026316., grad_fn=<MseLossBackward>)
output :  tensor([[240518.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(60980724., grad_fn=<MseLossBackward>)
output :  tensor([[241542.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8885e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147759.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6763e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85068.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7931e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197996.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9141e+09, grad_fn=<MseLossBackward>)
output :  tensor([[81416.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(173661.0312, grad_fn=<MseLossBackward>)
output :  tensor([[137901.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2554453., grad_fn=<MseLossBackward>)
output :  tensor([[75231.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(71895.2031, grad_fn=<MseLossBackward>)
output :  tensor([[143866.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(834996.1875, grad_fn=<MseLossBackward>)
output :  tensor([[175161.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(702610.6875, grad_fn=<MseLossBackward>)
output :  tensor([[153352.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(21747.0312, grad_fn=<MseLossBackward>)
output :  tensor([[107946.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(298525.6250, grad_fn=<MseLossBackward>)
output :  tensor([[203289.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2647e+10, grad_fn=<MseLossBackward>)
output :  tensor([[125811.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(7226940., grad_fn=<MseLossBackward>)
output :  tensor([[269157.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1756e+08, grad_fn=<MseLossBackward>)
output :  tensor([[302252.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(60018916., grad_fn=<MseLossBackward>)
output :  tensor([[107078.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(177510.8125, grad_fn=<MseLossBackward>)
output :  tensor([[171706.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(630187.8750, grad_fn=<MseLossBackward>)
output :  tensor([[133570.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5387e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147491.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(72100528., grad_fn=<MseLossBackward>)
output :  tensor([[129838.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(169692.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123302.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(2882434.7500, grad_fn=<MseLossBackward>)
output :  tensor([[134567.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2839e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226127.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8759e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190438.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2669e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143442.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(209120.4375, grad_fn=<MseLossBackward>)
output :  tensor([[125616.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(3546424.5000, grad_fn=<MseLossBackward>)
output :  tensor([[112211.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(924512.3125, grad_fn=<MseLossBackward>)
output :  tensor([[256685.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7670e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136535.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2359056., grad_fn=<MseLossBackward>)
output :  tensor([[208550.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(30807182., grad_fn=<MseLossBackward>)
output :  tensor([[101849.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(9303358., grad_fn=<MseLossBackward>)
output :  tensor([[138446.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2261687., grad_fn=<MseLossBackward>)
output :  tensor([[209897.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1325e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182883.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(8902764., grad_fn=<MseLossBackward>)
output :  tensor([[186678.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2817309.7500, grad_fn=<MseLossBackward>)
output :  tensor([[163914.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1050e+10, grad_fn=<MseLossBackward>)
output :  tensor([[298475.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3341e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197882.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(300.2639, grad_fn=<MseLossBackward>)
output :  tensor([[260834.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0172e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222363.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9041e+09, grad_fn=<MseLossBackward>)
output :  tensor([[287610.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6376e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225969.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3879668.7500, grad_fn=<MseLossBackward>)
output :  tensor([[224082.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8196e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193139.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(14900927., grad_fn=<MseLossBackward>)
output :  tensor([[158789.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8744e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131484.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1031367.1875, grad_fn=<MseLossBackward>)
output :  tensor([[135839.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(114952.7812, grad_fn=<MseLossBackward>)
output :  tensor([[92137.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1293337.5000, grad_fn=<MseLossBackward>)
output :  tensor([[104879.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(9736496., grad_fn=<MseLossBackward>)
output :  tensor([[274726.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9348e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237271.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5159641.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146158.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1343027.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139579.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4322436., grad_fn=<MseLossBackward>)
output :  tensor([[172088.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2703044.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144729.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(270757.6250, grad_fn=<MseLossBackward>)
output :  tensor([[164769.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8389e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165391.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(153247.7812, grad_fn=<MseLossBackward>)
output :  tensor([[136797.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(40968.2891, grad_fn=<MseLossBackward>)
output :  tensor([[188315.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3317e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111528.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(221863.0781, grad_fn=<MseLossBackward>)
output :  tensor([[175869.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(14972305., grad_fn=<MseLossBackward>)
output :  tensor([[122474.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(6124117., grad_fn=<MseLossBackward>)
output :  tensor([[87222.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(49485.3945, grad_fn=<MseLossBackward>)
output :  tensor([[179617.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(146473.6406, grad_fn=<MseLossBackward>)
output :  tensor([[108966.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(870809.7500, grad_fn=<MseLossBackward>)
output :  tensor([[240735.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3012556.7500, grad_fn=<MseLossBackward>)
output :  tensor([[247566.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6587243., grad_fn=<MseLossBackward>)
output :  tensor([[128970.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(280022.8750, grad_fn=<MseLossBackward>)
output :  tensor([[111048.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(4366696., grad_fn=<MseLossBackward>)
output :  tensor([[289662.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1754e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174319.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7947113.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130233.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(27386088., grad_fn=<MseLossBackward>)
output :  tensor([[144277.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9051e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203423.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1186e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140247.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(566726.6875, grad_fn=<MseLossBackward>)
output :  tensor([[157489.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5009e+10, grad_fn=<MseLossBackward>)
output :  tensor([[155755.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3443982., grad_fn=<MseLossBackward>)
output :  tensor([[130881.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1909319.3750, grad_fn=<MseLossBackward>)
output :  tensor([[249221.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6713e+10, grad_fn=<MseLossBackward>)
output :  tensor([[397104.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(23967756., grad_fn=<MseLossBackward>)
output :  tensor([[111491.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(6208779., grad_fn=<MseLossBackward>)
output :  tensor([[123642.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(26446672., grad_fn=<MseLossBackward>)
output :  tensor([[158218.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1642242.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128228.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6416e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163873.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3787e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172988.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9675e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105028.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(2039831.1250, grad_fn=<MseLossBackward>)
output :  tensor([[141175.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(30959.5020, grad_fn=<MseLossBackward>)
output :  tensor([[364673.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6869477., grad_fn=<MseLossBackward>)
output :  tensor([[205082.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3930e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179204.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(13725173., grad_fn=<MseLossBackward>)
output :  tensor([[205817.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(8513812., grad_fn=<MseLossBackward>)
output :  tensor([[141106.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4439251.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194310.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(36076.2539, grad_fn=<MseLossBackward>)
output :  tensor([[134564.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3248e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181092.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8512.9453, grad_fn=<MseLossBackward>)
output :  tensor([[240858.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1303057.8750, grad_fn=<MseLossBackward>)
output :  tensor([[171151.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(8116356., grad_fn=<MseLossBackward>)
output :  tensor([[108425.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(180837.5625, grad_fn=<MseLossBackward>)
output :  tensor([[264412.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(22135.8594, grad_fn=<MseLossBackward>)
output :  tensor([[251535.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2356800.7500, grad_fn=<MseLossBackward>)
output :  tensor([[121974.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1052515.7500, grad_fn=<MseLossBackward>)
output :  tensor([[216543.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4172e+09, grad_fn=<MseLossBackward>)
output :  tensor([[309495.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4977e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204061.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8632211., grad_fn=<MseLossBackward>)
output :  tensor([[215464.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5509e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159501.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2565953.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172048.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4237937., grad_fn=<MseLossBackward>)
output :  tensor([[160777.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(14791115., grad_fn=<MseLossBackward>)
output :  tensor([[167299.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(7292616., grad_fn=<MseLossBackward>)
output :  tensor([[239314.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2287e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219249.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0418e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158835.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4007e+08, grad_fn=<MseLossBackward>)
output :  tensor([[121825.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(1379835.6250, grad_fn=<MseLossBackward>)
output :  tensor([[176187.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(659877., grad_fn=<MseLossBackward>)
output :  tensor([[181401.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1777e+09, grad_fn=<MseLossBackward>)
output :  tensor([[209241.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4364e+10, grad_fn=<MseLossBackward>)
output :  tensor([[130893.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(12520208., grad_fn=<MseLossBackward>)
output :  tensor([[146745.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3229e+08, grad_fn=<MseLossBackward>)
output :  tensor([[277942.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(887481.7500, grad_fn=<MseLossBackward>)
output :  tensor([[87814.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7923609., grad_fn=<MseLossBackward>)
output :  tensor([[235195.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1701924.1250, grad_fn=<MseLossBackward>)
output :  tensor([[260786.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0378e+11, grad_fn=<MseLossBackward>)
output :  tensor([[171404.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1971523.1250, grad_fn=<MseLossBackward>)
output :  tensor([[193667.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7084e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154595.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(163746.6875, grad_fn=<MseLossBackward>)
output :  tensor([[207542.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9010e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127482.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(2303588.7500, grad_fn=<MseLossBackward>)
output :  tensor([[146332.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1775431.3750, grad_fn=<MseLossBackward>)
output :  tensor([[172622.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0736e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185530.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(101890.6328, grad_fn=<MseLossBackward>)
output :  tensor([[129474.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(12071010., grad_fn=<MseLossBackward>)
output :  tensor([[138314.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3293657.7500, grad_fn=<MseLossBackward>)
output :  tensor([[176637.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(13232088., grad_fn=<MseLossBackward>)
output :  tensor([[198669.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6348e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237884.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(26169140., grad_fn=<MseLossBackward>)
output :  tensor([[153670.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1766531.7500, grad_fn=<MseLossBackward>)
output :  tensor([[198079.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4323020.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162026.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2496e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181369.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3494971.7500, grad_fn=<MseLossBackward>)
output :  tensor([[180159.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(67178.1562, grad_fn=<MseLossBackward>)
output :  tensor([[98341.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(1798888.7500, grad_fn=<MseLossBackward>)
output :  tensor([[171949.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1675e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134584.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(172237.9688, grad_fn=<MseLossBackward>)
output :  tensor([[121256.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(39143108., grad_fn=<MseLossBackward>)
output :  tensor([[172461.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2366838., grad_fn=<MseLossBackward>)
output :  tensor([[84735.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(70200.1562, grad_fn=<MseLossBackward>)
output :  tensor([[283397.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(43590532., grad_fn=<MseLossBackward>)
output :  tensor([[165030.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(936.9338, grad_fn=<MseLossBackward>)
output :  tensor([[190100.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0468e+10, grad_fn=<MseLossBackward>)
output :  tensor([[247759.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4014e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149218.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3172684.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122695.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1700823.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122431.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(6406475., grad_fn=<MseLossBackward>)
output :  tensor([[143803.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2964e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176212.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4896193.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109360.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2148e+08, grad_fn=<MseLossBackward>)
output :  tensor([[210507.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1555e+10, grad_fn=<MseLossBackward>)
output :  tensor([[238350.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(9922008., grad_fn=<MseLossBackward>)
output :  tensor([[250968.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0800e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221121.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1963e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195759.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4338e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191898.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(19344328., grad_fn=<MseLossBackward>)
output :  tensor([[206509.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7681e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190729.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1103e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180116.]], grad_fn=<AddmmBackward>)
loss:  tensor(1893376., grad_fn=<MseLossBackward>)
output :  tensor([[152157.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(24870.2754, grad_fn=<MseLossBackward>)
output :  tensor([[338446.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2092271.8750, grad_fn=<MseLossBackward>)
output :  tensor([[208772.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(10418572., grad_fn=<MseLossBackward>)
output :  tensor([[158154.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3407139.2500, grad_fn=<MseLossBackward>)
output :  tensor([[190303.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6211e+09, grad_fn=<MseLossBackward>)
output :  tensor([[101111.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(15123410., grad_fn=<MseLossBackward>)
output :  tensor([[276181.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7740e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174132.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(54158.0156, grad_fn=<MseLossBackward>)
output :  tensor([[212825.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(455477.3438, grad_fn=<MseLossBackward>)
output :  tensor([[212329.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(75185160., grad_fn=<MseLossBackward>)
output :  tensor([[181609.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5806142., grad_fn=<MseLossBackward>)
output :  tensor([[198042.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(14121037., grad_fn=<MseLossBackward>)
output :  tensor([[156299.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1687725.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147631.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2687e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119547.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1096438., grad_fn=<MseLossBackward>)
output :  tensor([[140559.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(312708.1250, grad_fn=<MseLossBackward>)
output :  tensor([[147055.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3781384., grad_fn=<MseLossBackward>)
output :  tensor([[203499.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5500e+10, grad_fn=<MseLossBackward>)
output :  tensor([[162856.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(11263156., grad_fn=<MseLossBackward>)
output :  tensor([[99408.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(8299.4951, grad_fn=<MseLossBackward>)
output :  tensor([[225885.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9922e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185609.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0438e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177895.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1988540.6250, grad_fn=<MseLossBackward>)
output :  tensor([[82856.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(734007.1875, grad_fn=<MseLossBackward>)
output :  tensor([[128314.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(34581.4688, grad_fn=<MseLossBackward>)
output :  tensor([[213028.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(944753.6250, grad_fn=<MseLossBackward>)
output :  tensor([[144679.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(461125.8750, grad_fn=<MseLossBackward>)
output :  tensor([[128785.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1474327.1250, grad_fn=<MseLossBackward>)
output :  tensor([[142627.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(745.1194, grad_fn=<MseLossBackward>)
output :  tensor([[176654.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5331e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143511.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(238754.3906, grad_fn=<MseLossBackward>)
output :  tensor([[159616.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(146712.9375, grad_fn=<MseLossBackward>)
output :  tensor([[217142.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4589703.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135538.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3260e+08, grad_fn=<MseLossBackward>)
output :  tensor([[256990.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3960722., grad_fn=<MseLossBackward>)
output :  tensor([[160549.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1102204.7500, grad_fn=<MseLossBackward>)
output :  tensor([[131062.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6568328.5000, grad_fn=<MseLossBackward>)
output :  tensor([[96652.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2730859.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151771.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5254e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178613.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1653836.2500, grad_fn=<MseLossBackward>)
output :  tensor([[118503.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3985887.5000, grad_fn=<MseLossBackward>)
output :  tensor([[192685.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3151e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144097.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1728e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152078.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4744024.5000, grad_fn=<MseLossBackward>)
output :  tensor([[187382.]], grad_fn=<AddmmBackward>)
loss:  tensor(135424., grad_fn=<MseLossBackward>)
output :  tensor([[250952.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7745e+09, grad_fn=<MseLossBackward>)
output :  tensor([[89892.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(2584031.2500, grad_fn=<MseLossBackward>)
output :  tensor([[237030.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(8816910., grad_fn=<MseLossBackward>)
output :  tensor([[128944.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(197483.0312, grad_fn=<MseLossBackward>)
output :  tensor([[164972.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0186e+10, grad_fn=<MseLossBackward>)
output :  tensor([[112113.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4674e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174824.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1381028.8750, grad_fn=<MseLossBackward>)
output :  tensor([[162492.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3328e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155319.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1599e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238561.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(192035.6719, grad_fn=<MseLossBackward>)
output :  tensor([[224968.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0911e+09, grad_fn=<MseLossBackward>)
output :  tensor([[126437.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(316520.5312, grad_fn=<MseLossBackward>)
output :  tensor([[127409.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1986205.7500, grad_fn=<MseLossBackward>)
output :  tensor([[226796.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(41469.5039, grad_fn=<MseLossBackward>)
output :  tensor([[229815.]], grad_fn=<AddmmBackward>)
loss:  tensor(17514224., grad_fn=<MseLossBackward>)
output :  tensor([[230835.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(17103006., grad_fn=<MseLossBackward>)
output :  tensor([[149187.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1410898.5000, grad_fn=<MseLossBackward>)
output :  tensor([[212993.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(8962071., grad_fn=<MseLossBackward>)
output :  tensor([[129131.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(83387432., grad_fn=<MseLossBackward>)
output :  tensor([[137525.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(25251568., grad_fn=<MseLossBackward>)
output :  tensor([[311864.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9834300., grad_fn=<MseLossBackward>)
output :  tensor([[142946.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3788314.7500, grad_fn=<MseLossBackward>)
output :  tensor([[120101.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8197e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108000.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2247375.7500, grad_fn=<MseLossBackward>)
output :  tensor([[156177.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6643e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182179.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5646e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171155.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3402180.2500, grad_fn=<MseLossBackward>)
output :  tensor([[195952.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(25479780., grad_fn=<MseLossBackward>)
output :  tensor([[100874.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(765515.6250, grad_fn=<MseLossBackward>)
output :  tensor([[180601.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2564402., grad_fn=<MseLossBackward>)
output :  tensor([[167172.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(529824.7500, grad_fn=<MseLossBackward>)
output :  tensor([[139430.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(185693.6562, grad_fn=<MseLossBackward>)
output :  tensor([[259038.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0012e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141125.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1501e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175959.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(8756051., grad_fn=<MseLossBackward>)
output :  tensor([[141651.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2726059., grad_fn=<MseLossBackward>)
output :  tensor([[197436.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(9382448., grad_fn=<MseLossBackward>)
output :  tensor([[167563.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5935771., grad_fn=<MseLossBackward>)
output :  tensor([[244638.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(407682.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134003.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(246791.6094, grad_fn=<MseLossBackward>)
output :  tensor([[149986.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(405152.1562, grad_fn=<MseLossBackward>)
output :  tensor([[215282.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(79647.4219, grad_fn=<MseLossBackward>)
output :  tensor([[163825.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1380000.8750, grad_fn=<MseLossBackward>)
output :  tensor([[196986.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(63785928., grad_fn=<MseLossBackward>)
output :  tensor([[132021.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2783e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128943.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3144.7561, grad_fn=<MseLossBackward>)
output :  tensor([[134942.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(25582732., grad_fn=<MseLossBackward>)
output :  tensor([[203864.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3080e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166257.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6274e+09, grad_fn=<MseLossBackward>)
output :  tensor([[74355.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0607e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93320.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(77799840., grad_fn=<MseLossBackward>)
output :  tensor([[259872.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(43286120., grad_fn=<MseLossBackward>)
output :  tensor([[203011.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0975e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110873.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(17024778., grad_fn=<MseLossBackward>)
output :  tensor([[158502.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4087e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206761.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7525e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181144.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8953e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158170.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(10049891., grad_fn=<MseLossBackward>)
output :  tensor([[169758.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(58111.1289, grad_fn=<MseLossBackward>)
output :  tensor([[115919.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(844718.9375, grad_fn=<MseLossBackward>)
output :  tensor([[159985.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(24856300., grad_fn=<MseLossBackward>)
output :  tensor([[193648.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7559e+08, grad_fn=<MseLossBackward>)
output :  tensor([[218517.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(965582.6250, grad_fn=<MseLossBackward>)
output :  tensor([[246708.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4829e+11, grad_fn=<MseLossBackward>)
output :  tensor([[148474.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2174104.2500, grad_fn=<MseLossBackward>)
output :  tensor([[105979.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6251953.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169800.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4640e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151267.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(589536.0625, grad_fn=<MseLossBackward>)
output :  tensor([[237486.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(236287.1406, grad_fn=<MseLossBackward>)
output :  tensor([[114994.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(30.6812, grad_fn=<MseLossBackward>)
output :  tensor([[180009.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(8357519.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182564.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(17101068., grad_fn=<MseLossBackward>)
output :  tensor([[164108.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4302e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97160.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6117e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238700.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(89447.7266, grad_fn=<MseLossBackward>)
output :  tensor([[177648.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2716934., grad_fn=<MseLossBackward>)
output :  tensor([[141953.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3814392., grad_fn=<MseLossBackward>)
output :  tensor([[234939.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3641.3682, grad_fn=<MseLossBackward>)
output :  tensor([[166429.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(11760506., grad_fn=<MseLossBackward>)
output :  tensor([[205375.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4310e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136734.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3008436., grad_fn=<MseLossBackward>)
output :  tensor([[187164.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3326e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137531.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2346976.2500, grad_fn=<MseLossBackward>)
output :  tensor([[228907.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(50297572., grad_fn=<MseLossBackward>)
output :  tensor([[227623.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0071e+08, grad_fn=<MseLossBackward>)
output :  tensor([[90353.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(124940.1562, grad_fn=<MseLossBackward>)
output :  tensor([[162140.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(7325311.5000, grad_fn=<MseLossBackward>)
output :  tensor([[246701.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5420e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145376.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(141540.5469, grad_fn=<MseLossBackward>)
output :  tensor([[111286.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9613e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160770.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(13911851., grad_fn=<MseLossBackward>)
output :  tensor([[143789.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(44297.0938, grad_fn=<MseLossBackward>)
output :  tensor([[128378.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(31745.2168, grad_fn=<MseLossBackward>)
output :  tensor([[190149.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7404e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123972.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2168256.2500, grad_fn=<MseLossBackward>)
output :  tensor([[151248.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(564306.1250, grad_fn=<MseLossBackward>)
output :  tensor([[171194.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(308597.6250, grad_fn=<MseLossBackward>)
output :  tensor([[151794.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(631553.0625, grad_fn=<MseLossBackward>)
output :  tensor([[160002.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8393152., grad_fn=<MseLossBackward>)
output :  tensor([[136658.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6497e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133169.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1367620.6250, grad_fn=<MseLossBackward>)
output :  tensor([[153708.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1633e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144848.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(485743.6562, grad_fn=<MseLossBackward>)
output :  tensor([[164767.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9102855., grad_fn=<MseLossBackward>)
output :  tensor([[137890.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8344e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149778.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(957523.4375, grad_fn=<MseLossBackward>)
output :  tensor([[185294.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7320322., grad_fn=<MseLossBackward>)
output :  tensor([[168809.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(36439.2305, grad_fn=<MseLossBackward>)
output :  tensor([[180017.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(316.1729, grad_fn=<MseLossBackward>)
output :  tensor([[220978.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(957584.5625, grad_fn=<MseLossBackward>)
output :  tensor([[109625.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2977350.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139163.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0344e+08, grad_fn=<MseLossBackward>)
output :  tensor([[286774.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(599414.6875, grad_fn=<MseLossBackward>)
output :  tensor([[122131.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(37598932., grad_fn=<MseLossBackward>)
output :  tensor([[177261.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8266e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186317.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1736094.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180997.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(20268848., grad_fn=<MseLossBackward>)
output :  tensor([[252941.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8656e+08, grad_fn=<MseLossBackward>)
output :  tensor([[216164.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(34049776., grad_fn=<MseLossBackward>)
output :  tensor([[124396.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4214e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174117.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4594e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122214.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(3188875.2500, grad_fn=<MseLossBackward>)
output :  tensor([[183545.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5144e+10, grad_fn=<MseLossBackward>)
output :  tensor([[154041.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1085503.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152725.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(38757432., grad_fn=<MseLossBackward>)
output :  tensor([[205447.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(726623.0625, grad_fn=<MseLossBackward>)
output :  tensor([[144302.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3931e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176782.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(611866.1875, grad_fn=<MseLossBackward>)
output :  tensor([[254797.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1023e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147674.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(106214.8828, grad_fn=<MseLossBackward>)
output :  tensor([[201181.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2200262.2500, grad_fn=<MseLossBackward>)
output :  tensor([[164097.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(17204090., grad_fn=<MseLossBackward>)
output :  tensor([[123268.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2439e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135344.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(164113.6094, grad_fn=<MseLossBackward>)
output :  tensor([[184524.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(274936.3750, grad_fn=<MseLossBackward>)
output :  tensor([[195773.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(33332040., grad_fn=<MseLossBackward>)
output :  tensor([[236390.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7678e+09, grad_fn=<MseLossBackward>)
output :  tensor([[256498.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(251126.2656, grad_fn=<MseLossBackward>)
output :  tensor([[188604.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7003e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141523.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5024e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145365.]], grad_fn=<AddmmBackward>)
loss:  tensor(748225., grad_fn=<MseLossBackward>)
output :  tensor([[70823.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5009e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138398.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(11552245., grad_fn=<MseLossBackward>)
output :  tensor([[127602.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(1683445.3750, grad_fn=<MseLossBackward>)
output :  tensor([[154131.]], grad_fn=<AddmmBackward>)
loss:  tensor(17161., grad_fn=<MseLossBackward>)
output :  tensor([[127457.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(209592.2812, grad_fn=<MseLossBackward>)
output :  tensor([[77481.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(963081.5625, grad_fn=<MseLossBackward>)
output :  tensor([[87936.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(35239620., grad_fn=<MseLossBackward>)
output :  tensor([[225039.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(48454216., grad_fn=<MseLossBackward>)
output :  tensor([[139166.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1111e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129769.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(534223.9375, grad_fn=<MseLossBackward>)
output :  tensor([[168920.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3687240., grad_fn=<MseLossBackward>)
output :  tensor([[234239.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(578859.4375, grad_fn=<MseLossBackward>)
output :  tensor([[187180.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(24597106., grad_fn=<MseLossBackward>)
output :  tensor([[156318.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(101621.4844, grad_fn=<MseLossBackward>)
output :  tensor([[199998.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4402915.5000, grad_fn=<MseLossBackward>)
output :  tensor([[205939.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6476e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136728.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(73551.1328, grad_fn=<MseLossBackward>)
output :  tensor([[154197.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(644106.5625, grad_fn=<MseLossBackward>)
output :  tensor([[134698.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1693088.8750, grad_fn=<MseLossBackward>)
output :  tensor([[200873.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4833e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156594.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6733295., grad_fn=<MseLossBackward>)
output :  tensor([[134628.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6915e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147797.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(8397589., grad_fn=<MseLossBackward>)
output :  tensor([[207335.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(21761350., grad_fn=<MseLossBackward>)
output :  tensor([[101957.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9831e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164328.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(10058908., grad_fn=<MseLossBackward>)
output :  tensor([[129581.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2499709.2500, grad_fn=<MseLossBackward>)
output :  tensor([[146643.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(127014.2812, grad_fn=<MseLossBackward>)
output :  tensor([[98516.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3057e+09, grad_fn=<MseLossBackward>)
output :  tensor([[140094.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6731106., grad_fn=<MseLossBackward>)
output :  tensor([[236701.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(492014.5625, grad_fn=<MseLossBackward>)
output :  tensor([[145443.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(197052.7656, grad_fn=<MseLossBackward>)
output :  tensor([[137293.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(42758.4844, grad_fn=<MseLossBackward>)
output :  tensor([[162884.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2169e+09, grad_fn=<MseLossBackward>)
output :  tensor([[269993.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(64108044., grad_fn=<MseLossBackward>)
output :  tensor([[172495.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6274320.5000, grad_fn=<MseLossBackward>)
output :  tensor([[104006.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1514514.7500, grad_fn=<MseLossBackward>)
output :  tensor([[201948.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7080e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153050.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(35400084., grad_fn=<MseLossBackward>)
output :  tensor([[163968.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5564e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97842.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(208906.1250, grad_fn=<MseLossBackward>)
output :  tensor([[126050.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(6004988.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157589.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2526063.2500, grad_fn=<MseLossBackward>)
output :  tensor([[141580.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2499116.2500, grad_fn=<MseLossBackward>)
output :  tensor([[200565.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(319383.9375, grad_fn=<MseLossBackward>)
output :  tensor([[142410.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(168895.3125, grad_fn=<MseLossBackward>)
output :  tensor([[265184.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(8433761., grad_fn=<MseLossBackward>)
output :  tensor([[127783.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2099e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165817.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(100746.7266, grad_fn=<MseLossBackward>)
output :  tensor([[190479.]], grad_fn=<AddmmBackward>)
loss:  tensor(3916441., grad_fn=<MseLossBackward>)
output :  tensor([[121887.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4131e+08, grad_fn=<MseLossBackward>)
output :  tensor([[246360.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(13244027., grad_fn=<MseLossBackward>)
output :  tensor([[158970.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8566e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243449.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3611544., grad_fn=<MseLossBackward>)
output :  tensor([[145759.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3094960.5000, grad_fn=<MseLossBackward>)
output :  tensor([[208761.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1534308., grad_fn=<MseLossBackward>)
output :  tensor([[173147.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(558055.6875, grad_fn=<MseLossBackward>)
output :  tensor([[153784.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(46319.1094, grad_fn=<MseLossBackward>)
output :  tensor([[115832.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(4699309.5000, grad_fn=<MseLossBackward>)
output :  tensor([[238239.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3864e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238302.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2880180.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155607.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5154319., grad_fn=<MseLossBackward>)
output :  tensor([[251820.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(9480433., grad_fn=<MseLossBackward>)
output :  tensor([[124519.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0031e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179056.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9343530., grad_fn=<MseLossBackward>)
output :  tensor([[163619.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(13102929., grad_fn=<MseLossBackward>)
output :  tensor([[129838.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1349154.8750, grad_fn=<MseLossBackward>)
output :  tensor([[194623.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2410e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165031.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1063927.7500, grad_fn=<MseLossBackward>)
output :  tensor([[165914.]], grad_fn=<AddmmBackward>)
loss:  tensor(8491396., grad_fn=<MseLossBackward>)
output :  tensor([[158135.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(18377.1914, grad_fn=<MseLossBackward>)
output :  tensor([[144854.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(25456440., grad_fn=<MseLossBackward>)
output :  tensor([[173092.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0440e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163461.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(11983821., grad_fn=<MseLossBackward>)
output :  tensor([[377463.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(42340236., grad_fn=<MseLossBackward>)
output :  tensor([[124019.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(8882030., grad_fn=<MseLossBackward>)
output :  tensor([[128264.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8288e+09, grad_fn=<MseLossBackward>)
output :  tensor([[277078.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(17092282., grad_fn=<MseLossBackward>)
output :  tensor([[160804.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1429593.8750, grad_fn=<MseLossBackward>)
output :  tensor([[128714.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(67485200., grad_fn=<MseLossBackward>)
output :  tensor([[231815.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(34190.3203, grad_fn=<MseLossBackward>)
output :  tensor([[176619.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(15058765., grad_fn=<MseLossBackward>)
output :  tensor([[152048.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2390.2932, grad_fn=<MseLossBackward>)
output :  tensor([[147311.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5344188., grad_fn=<MseLossBackward>)
output :  tensor([[155991.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6449e+08, grad_fn=<MseLossBackward>)
output :  tensor([[103119.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(9731232., grad_fn=<MseLossBackward>)
output :  tensor([[74719.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1665e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163809.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1417997.2500, grad_fn=<MseLossBackward>)
output :  tensor([[190836.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3811e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157102.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(806375.9375, grad_fn=<MseLossBackward>)
output :  tensor([[159511.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4044623.7500, grad_fn=<MseLossBackward>)
output :  tensor([[136069.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1905737.1250, grad_fn=<MseLossBackward>)
output :  tensor([[207290.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1797903.8750, grad_fn=<MseLossBackward>)
output :  tensor([[138640.]], grad_fn=<AddmmBackward>)
loss:  tensor(409600., grad_fn=<MseLossBackward>)
output :  tensor([[181386.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6541e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141204.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(22999668., grad_fn=<MseLossBackward>)
output :  tensor([[109906.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2395e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96757.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(7602901.5000, grad_fn=<MseLossBackward>)
output :  tensor([[173584.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2004171.1250, grad_fn=<MseLossBackward>)
output :  tensor([[249825.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1181e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140581.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(842953.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160468.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(328651.4062, grad_fn=<MseLossBackward>)
output :  tensor([[130783.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2947713.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147768.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2997172.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172318.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(19526732., grad_fn=<MseLossBackward>)
output :  tensor([[125435.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(2448956., grad_fn=<MseLossBackward>)
output :  tensor([[173721.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2490e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157856.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(733779.6250, grad_fn=<MseLossBackward>)
output :  tensor([[114351.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(4617294.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159989.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3306e+09, grad_fn=<MseLossBackward>)
output :  tensor([[50594.9883]], grad_fn=<AddmmBackward>)
loss:  tensor(1974057.8750, grad_fn=<MseLossBackward>)
output :  tensor([[231976.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4841e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199046.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3815796., grad_fn=<MseLossBackward>)
output :  tensor([[183015.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3938612.2500, grad_fn=<MseLossBackward>)
output :  tensor([[106442.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(195923.8125, grad_fn=<MseLossBackward>)
output :  tensor([[87401.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(160938.8750, grad_fn=<MseLossBackward>)
output :  tensor([[134656.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(28551656., grad_fn=<MseLossBackward>)
output :  tensor([[222312.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1391e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205183.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5364145.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166837.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3378186.5000, grad_fn=<MseLossBackward>)
output :  tensor([[173808.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3158e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190485.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(236059.3281, grad_fn=<MseLossBackward>)
output :  tensor([[86113.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(786644.2500, grad_fn=<MseLossBackward>)
output :  tensor([[137996.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4012384.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109719.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(608899.8125, grad_fn=<MseLossBackward>)
output :  tensor([[148176.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4924e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171365.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6294e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196535.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(71654376., grad_fn=<MseLossBackward>)
output :  tensor([[177902.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4398130., grad_fn=<MseLossBackward>)
output :  tensor([[97203.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(495209.0938, grad_fn=<MseLossBackward>)
output :  tensor([[118211.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(505976.5938, grad_fn=<MseLossBackward>)
output :  tensor([[160773.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3947e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198956.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1088501., grad_fn=<MseLossBackward>)
output :  tensor([[141573.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5888357., grad_fn=<MseLossBackward>)
train_loss: [2.5659837e+09]
epoch_result tensor([0.])
output :  tensor([[159403.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(816848.8125, grad_fn=<MseLossBackward>)
output :  tensor([[118197.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(14456273., grad_fn=<MseLossBackward>)
output :  tensor([[195739.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2367799.7500, grad_fn=<MseLossBackward>)
output :  tensor([[178481.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2193407.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153176.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1622e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128484.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(235081.0312, grad_fn=<MseLossBackward>)
output :  tensor([[140259.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(548085.7500, grad_fn=<MseLossBackward>)
output :  tensor([[116622.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(5653732., grad_fn=<MseLossBackward>)
output :  tensor([[64893.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(40873944., grad_fn=<MseLossBackward>)
output :  tensor([[165756.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(59246.6016, grad_fn=<MseLossBackward>)
output :  tensor([[142661.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7081503., grad_fn=<MseLossBackward>)
output :  tensor([[225857.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(734582.9375, grad_fn=<MseLossBackward>)
output :  tensor([[171138.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4574786.5000, grad_fn=<MseLossBackward>)
output :  tensor([[248171.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2336742.2500, grad_fn=<MseLossBackward>)
output :  tensor([[53728.0117]], grad_fn=<AddmmBackward>)
loss:  tensor(1617954.2500, grad_fn=<MseLossBackward>)
output :  tensor([[160086.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4295e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184635.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(92838040., grad_fn=<MseLossBackward>)
output :  tensor([[164523.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(64373292., grad_fn=<MseLossBackward>)
output :  tensor([[275457.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(209106.1406, grad_fn=<MseLossBackward>)
output :  tensor([[194453.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6484901., grad_fn=<MseLossBackward>)
output :  tensor([[138219.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5230e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194557.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(460298.6562, grad_fn=<MseLossBackward>)
output :  tensor([[178502.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1527e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151697.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(486484.4688, grad_fn=<MseLossBackward>)
output :  tensor([[171918.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3679982.7500, grad_fn=<MseLossBackward>)
output :  tensor([[84329.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(1145351.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168919.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1270e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180880.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(16967062., grad_fn=<MseLossBackward>)
output :  tensor([[206409.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4098e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107344.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(7053091., grad_fn=<MseLossBackward>)
output :  tensor([[171560.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(314668.4062, grad_fn=<MseLossBackward>)
output :  tensor([[139607.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9655003., grad_fn=<MseLossBackward>)
output :  tensor([[132421.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(11709549., grad_fn=<MseLossBackward>)
output :  tensor([[121140.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2691599., grad_fn=<MseLossBackward>)
output :  tensor([[144169.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3817e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171827.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0498e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153220.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(12393920., grad_fn=<MseLossBackward>)
output :  tensor([[182427.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5893894., grad_fn=<MseLossBackward>)
output :  tensor([[143915.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8500505., grad_fn=<MseLossBackward>)
output :  tensor([[108754.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5171e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135534.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3148e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139234.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(17931388., grad_fn=<MseLossBackward>)
output :  tensor([[135993.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(80882760., grad_fn=<MseLossBackward>)
output :  tensor([[224224.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(601618.3750, grad_fn=<MseLossBackward>)
output :  tensor([[131655.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(353393.0938, grad_fn=<MseLossBackward>)
output :  tensor([[147207.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3212384., grad_fn=<MseLossBackward>)
output :  tensor([[104322.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(58944844., grad_fn=<MseLossBackward>)
output :  tensor([[160974.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(949254.3750, grad_fn=<MseLossBackward>)
output :  tensor([[148939.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1215e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191537.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(214224.3438, grad_fn=<MseLossBackward>)
output :  tensor([[133470.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(958563.3750, grad_fn=<MseLossBackward>)
output :  tensor([[104943.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(25572538., grad_fn=<MseLossBackward>)
output :  tensor([[237021.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(9127857., grad_fn=<MseLossBackward>)
output :  tensor([[167306.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1329e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161358.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5563701.5000, grad_fn=<MseLossBackward>)
output :  tensor([[203240.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8649e+10, grad_fn=<MseLossBackward>)
output :  tensor([[248598.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1110e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146287.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7768501.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135942.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3772274.2500, grad_fn=<MseLossBackward>)
output :  tensor([[160046.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(25465742., grad_fn=<MseLossBackward>)
output :  tensor([[135234.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(27397374., grad_fn=<MseLossBackward>)
output :  tensor([[181927.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0954e+09, grad_fn=<MseLossBackward>)
output :  tensor([[184134.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1158.1260, grad_fn=<MseLossBackward>)
output :  tensor([[162971.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2164898.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136748.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(39084964., grad_fn=<MseLossBackward>)
output :  tensor([[142421.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6105.9570, grad_fn=<MseLossBackward>)
output :  tensor([[147289.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5240021.5000, grad_fn=<MseLossBackward>)
output :  tensor([[173979.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3174e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197123.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9506e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139334.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8034656., grad_fn=<MseLossBackward>)
output :  tensor([[174082.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4764807., grad_fn=<MseLossBackward>)
output :  tensor([[178885.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4471110., grad_fn=<MseLossBackward>)
output :  tensor([[118817.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(14572710., grad_fn=<MseLossBackward>)
output :  tensor([[218923.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4312890.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180107.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(11506300., grad_fn=<MseLossBackward>)
output :  tensor([[127128.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2652063.2500, grad_fn=<MseLossBackward>)
output :  tensor([[198106.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2580992.7500, grad_fn=<MseLossBackward>)
output :  tensor([[173497.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1967532.2500, grad_fn=<MseLossBackward>)
output :  tensor([[211184.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0648e+10, grad_fn=<MseLossBackward>)
output :  tensor([[208804.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4819191., grad_fn=<MseLossBackward>)
output :  tensor([[165963.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2224e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194094.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(164658.4219, grad_fn=<MseLossBackward>)
output :  tensor([[111167.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(3358142.2500, grad_fn=<MseLossBackward>)
output :  tensor([[112805.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(93368.4375, grad_fn=<MseLossBackward>)
output :  tensor([[112584.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(342161.0312, grad_fn=<MseLossBackward>)
output :  tensor([[145509.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1666035.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163163.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2213e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177391.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6802316., grad_fn=<MseLossBackward>)
output :  tensor([[128814.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1728773., grad_fn=<MseLossBackward>)
output :  tensor([[143559.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2075355.3750, grad_fn=<MseLossBackward>)
output :  tensor([[180505.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0798e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117029.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(16669.2305, grad_fn=<MseLossBackward>)
output :  tensor([[196270.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(531577.6875, grad_fn=<MseLossBackward>)
output :  tensor([[145333.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(111065.9766, grad_fn=<MseLossBackward>)
output :  tensor([[214015.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1243712.8750, grad_fn=<MseLossBackward>)
output :  tensor([[127188.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1412680.8750, grad_fn=<MseLossBackward>)
output :  tensor([[248562.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(55166.2656, grad_fn=<MseLossBackward>)
output :  tensor([[241330.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9070e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145024.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8561e+08, grad_fn=<MseLossBackward>)
output :  tensor([[87647.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1009e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194947.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3924e+09, grad_fn=<MseLossBackward>)
output :  tensor([[77397.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(12977500., grad_fn=<MseLossBackward>)
output :  tensor([[140226.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(527597.9375, grad_fn=<MseLossBackward>)
output :  tensor([[76917.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2009572., grad_fn=<MseLossBackward>)
output :  tensor([[142124.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(685635.7500, grad_fn=<MseLossBackward>)
output :  tensor([[175286.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(509662.1250, grad_fn=<MseLossBackward>)
output :  tensor([[152741.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(575915., grad_fn=<MseLossBackward>)
output :  tensor([[109801.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(5766564.5000, grad_fn=<MseLossBackward>)
output :  tensor([[203557.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2587e+10, grad_fn=<MseLossBackward>)
output :  tensor([[129219.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(517691.5000, grad_fn=<MseLossBackward>)
output :  tensor([[272272.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(59713772., grad_fn=<MseLossBackward>)
output :  tensor([[304557.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(29618766., grad_fn=<MseLossBackward>)
output :  tensor([[112184.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(21949006., grad_fn=<MseLossBackward>)
output :  tensor([[169815.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7208637.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135719.]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6834e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135101.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(15198668., grad_fn=<MseLossBackward>)
output :  tensor([[133236.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(8921142., grad_fn=<MseLossBackward>)
output :  tensor([[129063.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(16508667., grad_fn=<MseLossBackward>)
output :  tensor([[134470.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2351e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226734.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8520e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188862.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3146e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144792.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(797421.1250, grad_fn=<MseLossBackward>)
output :  tensor([[131145.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(13288189., grad_fn=<MseLossBackward>)
output :  tensor([[109020.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(4972656., grad_fn=<MseLossBackward>)
output :  tensor([[258425.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5564e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138252.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(10581501., grad_fn=<MseLossBackward>)
output :  tensor([[202282.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(514537.2188, grad_fn=<MseLossBackward>)
output :  tensor([[105977.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1161444., grad_fn=<MseLossBackward>)
output :  tensor([[138626.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1750701.1250, grad_fn=<MseLossBackward>)
output :  tensor([[209389.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2834e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180249.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(121844.6250, grad_fn=<MseLossBackward>)
output :  tensor([[186231.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1516553.7500, grad_fn=<MseLossBackward>)
output :  tensor([[163431.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1190e+10, grad_fn=<MseLossBackward>)
output :  tensor([[299191.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2823e+09, grad_fn=<MseLossBackward>)
output :  tensor([[197500.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(159512.8750, grad_fn=<MseLossBackward>)
output :  tensor([[255737.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1645e+10, grad_fn=<MseLossBackward>)
output :  tensor([[223154.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8357e+09, grad_fn=<MseLossBackward>)
output :  tensor([[284271.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0712e+09, grad_fn=<MseLossBackward>)
output :  tensor([[223636.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(132393.6406, grad_fn=<MseLossBackward>)
output :  tensor([[223194.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8495e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196423.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(332406.3125, grad_fn=<MseLossBackward>)
output :  tensor([[159897.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5463e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133978.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2186655.2500, grad_fn=<MseLossBackward>)
output :  tensor([[133629.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3497133.7500, grad_fn=<MseLossBackward>)
output :  tensor([[92004.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1008643.6250, grad_fn=<MseLossBackward>)
output :  tensor([[105989.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(4042518.7500, grad_fn=<MseLossBackward>)
output :  tensor([[275025.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9024e+09, grad_fn=<MseLossBackward>)
output :  tensor([[229997.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(25025476., grad_fn=<MseLossBackward>)
output :  tensor([[146471.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2164806.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137530.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(911.2852, grad_fn=<MseLossBackward>)
output :  tensor([[176849.]], grad_fn=<AddmmBackward>)
loss:  tensor(9709456., grad_fn=<MseLossBackward>)
output :  tensor([[150453.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(27076088., grad_fn=<MseLossBackward>)
output :  tensor([[165951.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1502e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167630.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6921750., grad_fn=<MseLossBackward>)
output :  tensor([[135648.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1826847.8750, grad_fn=<MseLossBackward>)
output :  tensor([[189770.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5253e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114868.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(8229413., grad_fn=<MseLossBackward>)
output :  tensor([[167883.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(16946602., grad_fn=<MseLossBackward>)
output :  tensor([[120228.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(52030.3242, grad_fn=<MseLossBackward>)
output :  tensor([[86614.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(148351.3594, grad_fn=<MseLossBackward>)
output :  tensor([[180497.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(247335.2656, grad_fn=<MseLossBackward>)
output :  tensor([[112526.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6896861., grad_fn=<MseLossBackward>)
output :  tensor([[234692.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(18556710., grad_fn=<MseLossBackward>)
output :  tensor([[244864.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(18305.2441, grad_fn=<MseLossBackward>)
output :  tensor([[132162.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(7087492., grad_fn=<MseLossBackward>)
output :  tensor([[107279.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(2820484., grad_fn=<MseLossBackward>)
output :  tensor([[287671.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2345e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170294.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1452815.8750, grad_fn=<MseLossBackward>)
output :  tensor([[127383.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5682487.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140978.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2800e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203260.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1533e+08, grad_fn=<MseLossBackward>)
output :  tensor([[143946.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(8679468., grad_fn=<MseLossBackward>)
output :  tensor([[159852.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4435e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152440.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2129273.7500, grad_fn=<MseLossBackward>)
output :  tensor([[131459.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3838293.2500, grad_fn=<MseLossBackward>)
output :  tensor([[248953.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6782e+10, grad_fn=<MseLossBackward>)
output :  tensor([[398170.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(14661720., grad_fn=<MseLossBackward>)
output :  tensor([[113961.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(24614776., grad_fn=<MseLossBackward>)
output :  tensor([[114710.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(14359008., grad_fn=<MseLossBackward>)
output :  tensor([[161606.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4435433.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130982.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2981e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161814.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6223e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171270.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7541e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105946.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(5508299., grad_fn=<MseLossBackward>)
output :  tensor([[139882.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1248282.5000, grad_fn=<MseLossBackward>)
output :  tensor([[361893.]], grad_fn=<AddmmBackward>)
loss:  tensor(29170800., grad_fn=<MseLossBackward>)
output :  tensor([[208156.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1017e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178341.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8075010., grad_fn=<MseLossBackward>)
output :  tensor([[200020.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(8289630.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138847.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(23280.0840, grad_fn=<MseLossBackward>)
output :  tensor([[195617.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1247723.8750, grad_fn=<MseLossBackward>)
output :  tensor([[135565.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8765e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177554.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(11870394., grad_fn=<MseLossBackward>)
output :  tensor([[240945.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1112596.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171541.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6045835.5000, grad_fn=<MseLossBackward>)
output :  tensor([[107963.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1355.1602, grad_fn=<MseLossBackward>)
output :  tensor([[264887.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(106296.3750, grad_fn=<MseLossBackward>)
output :  tensor([[261714.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3722e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126582.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(12835818., grad_fn=<MseLossBackward>)
output :  tensor([[218082.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2396e+09, grad_fn=<MseLossBackward>)
output :  tensor([[308721.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7485e+08, grad_fn=<MseLossBackward>)
output :  tensor([[210691.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(13627980., grad_fn=<MseLossBackward>)
output :  tensor([[214397.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5776e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157525.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(140109.8438, grad_fn=<MseLossBackward>)
output :  tensor([[169301.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(473903.1562, grad_fn=<MseLossBackward>)
output :  tensor([[157594.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(438616.4688, grad_fn=<MseLossBackward>)
output :  tensor([[173195.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(10212718., grad_fn=<MseLossBackward>)
output :  tensor([[238439.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7384e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224022.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(29521564., grad_fn=<MseLossBackward>)
output :  tensor([[161936.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2309e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124975.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3901550.7500, grad_fn=<MseLossBackward>)
output :  tensor([[178032.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1065056.2500, grad_fn=<MseLossBackward>)
output :  tensor([[180598.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3046e+09, grad_fn=<MseLossBackward>)
output :  tensor([[208607.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4599e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133754.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(459239.1562, grad_fn=<MseLossBackward>)
output :  tensor([[146791.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3461e+08, grad_fn=<MseLossBackward>)
output :  tensor([[271286.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(32645154., grad_fn=<MseLossBackward>)
output :  tensor([[88598.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(12949202., grad_fn=<MseLossBackward>)
output :  tensor([[239192.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7248546.5000, grad_fn=<MseLossBackward>)
output :  tensor([[260796.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0377e+11, grad_fn=<MseLossBackward>)
output :  tensor([[170588.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(345946.1562, grad_fn=<MseLossBackward>)
output :  tensor([[194832.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6134e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154909.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8275.3135, grad_fn=<MseLossBackward>)
output :  tensor([[206595.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0201e+09, grad_fn=<MseLossBackward>)
output :  tensor([[125951.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(9292781., grad_fn=<MseLossBackward>)
output :  tensor([[144750.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(62445.3242, grad_fn=<MseLossBackward>)
output :  tensor([[171193.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2332e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188047.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4826877.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125928.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5067.6602, grad_fn=<MseLossBackward>)
output :  tensor([[140566.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(16532737., grad_fn=<MseLossBackward>)
output :  tensor([[175656.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7057739.5000, grad_fn=<MseLossBackward>)
output :  tensor([[199423.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5579e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239539.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(11978088., grad_fn=<MseLossBackward>)
output :  tensor([[155321.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(103573.3438, grad_fn=<MseLossBackward>)
output :  tensor([[197051.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1106441., grad_fn=<MseLossBackward>)
output :  tensor([[160135.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6037e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179405.]], grad_fn=<AddmmBackward>)
loss:  tensor(9025., grad_fn=<MseLossBackward>)
output :  tensor([[177100.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7837812.5000, grad_fn=<MseLossBackward>)
output :  tensor([[97003.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(10.1104, grad_fn=<MseLossBackward>)
output :  tensor([[174180.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1198e+10, grad_fn=<MseLossBackward>)
output :  tensor([[138786.]], grad_fn=<AddmmBackward>)
loss:  tensor(14333796., grad_fn=<MseLossBackward>)
output :  tensor([[119237.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(17960446., grad_fn=<MseLossBackward>)
output :  tensor([[168539.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(29815354., grad_fn=<MseLossBackward>)
output :  tensor([[88901.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(15221032., grad_fn=<MseLossBackward>)
output :  tensor([[292868.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(8227754.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163995.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1009868., grad_fn=<MseLossBackward>)
output :  tensor([[191805.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9983e+10, grad_fn=<MseLossBackward>)
output :  tensor([[248628.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0049e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150713.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(81903.2812, grad_fn=<MseLossBackward>)
output :  tensor([[123492.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(257754.5312, grad_fn=<MseLossBackward>)
output :  tensor([[117205.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7262519.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144119.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4797e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172435.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2447024.7500, grad_fn=<MseLossBackward>)
output :  tensor([[108969.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0062e+08, grad_fn=<MseLossBackward>)
output :  tensor([[211410.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1361e+10, grad_fn=<MseLossBackward>)
output :  tensor([[240986.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(263890.9062, grad_fn=<MseLossBackward>)
output :  tensor([[254706.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9736e+10, grad_fn=<MseLossBackward>)
output :  tensor([[223214.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4920e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197438.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3939e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189369.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3495380.7500, grad_fn=<MseLossBackward>)
output :  tensor([[205843.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7973e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190162.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1269e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177095.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2704740., grad_fn=<MseLossBackward>)
output :  tensor([[151749.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(62977.4727, grad_fn=<MseLossBackward>)
output :  tensor([[335530.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2160716.2500, grad_fn=<MseLossBackward>)
output :  tensor([[209019.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(8881797., grad_fn=<MseLossBackward>)
output :  tensor([[161165.]], grad_fn=<AddmmBackward>)
loss:  tensor(1357225., grad_fn=<MseLossBackward>)
output :  tensor([[188601.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7983e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105368.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(135844.0781, grad_fn=<MseLossBackward>)
output :  tensor([[275744.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7983e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170216.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(13571280., grad_fn=<MseLossBackward>)
output :  tensor([[214437.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(879316.4375, grad_fn=<MseLossBackward>)
output :  tensor([[213799.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(51841352., grad_fn=<MseLossBackward>)
output :  tensor([[175167.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(16260930., grad_fn=<MseLossBackward>)
output :  tensor([[201433.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(134093.2812, grad_fn=<MseLossBackward>)
output :  tensor([[155920.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(847205.1875, grad_fn=<MseLossBackward>)
output :  tensor([[146530.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1651e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119253.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(568221.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137501.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6241331., grad_fn=<MseLossBackward>)
output :  tensor([[148600.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(159537.8281, grad_fn=<MseLossBackward>)
output :  tensor([[201076.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6110e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160761.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1591776.5000, grad_fn=<MseLossBackward>)
output :  tensor([[99515.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(235.1910, grad_fn=<MseLossBackward>)
output :  tensor([[226380.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8548e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184437.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5862e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173988.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6231654., grad_fn=<MseLossBackward>)
output :  tensor([[80390.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2588981.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129853.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1832004.5000, grad_fn=<MseLossBackward>)
output :  tensor([[218036.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(16296864., grad_fn=<MseLossBackward>)
output :  tensor([[142826.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1377872.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134469.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(19973358., grad_fn=<MseLossBackward>)
output :  tensor([[141248.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1826214.3750, grad_fn=<MseLossBackward>)
output :  tensor([[175875.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4727e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146460.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6055521.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159701.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(89326.2656, grad_fn=<MseLossBackward>)
output :  tensor([[212620.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5663730.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135406.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2457e+08, grad_fn=<MseLossBackward>)
output :  tensor([[259158.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(17292862., grad_fn=<MseLossBackward>)
output :  tensor([[158550.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(901609.6250, grad_fn=<MseLossBackward>)
output :  tensor([[130836.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5457261., grad_fn=<MseLossBackward>)
output :  tensor([[96094.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1198032.8750, grad_fn=<MseLossBackward>)
output :  tensor([[154467.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8954e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180943.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1089414., grad_fn=<MseLossBackward>)
output :  tensor([[120233.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(71130.5547, grad_fn=<MseLossBackward>)
output :  tensor([[191031.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4378e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145247.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3227e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150404.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(254299.5781, grad_fn=<MseLossBackward>)
output :  tensor([[188271.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(272076.3438, grad_fn=<MseLossBackward>)
output :  tensor([[254121.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5175e+09, grad_fn=<MseLossBackward>)
output :  tensor([[89585.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3666626.5000, grad_fn=<MseLossBackward>)
output :  tensor([[239326.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(453034.1562, grad_fn=<MseLossBackward>)
output :  tensor([[128395.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(11015.1582, grad_fn=<MseLossBackward>)
output :  tensor([[166095.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9609e+09, grad_fn=<MseLossBackward>)
output :  tensor([[112736.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6221e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177633.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2668373.2500, grad_fn=<MseLossBackward>)
output :  tensor([[163392.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7562e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153932.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4907e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235635.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(11322068., grad_fn=<MseLossBackward>)
output :  tensor([[224138.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1466e+09, grad_fn=<MseLossBackward>)
output :  tensor([[125916.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(1173481.3750, grad_fn=<MseLossBackward>)
output :  tensor([[128126.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(4524096., grad_fn=<MseLossBackward>)
output :  tensor([[224458.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6460096., grad_fn=<MseLossBackward>)
output :  tensor([[231498.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6257267.5000, grad_fn=<MseLossBackward>)
output :  tensor([[225773.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(857852.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144733.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(10667368., grad_fn=<MseLossBackward>)
output :  tensor([[212540.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(6455807.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130265.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0538e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137683.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(26870454., grad_fn=<MseLossBackward>)
output :  tensor([[311135.]], grad_fn=<AddmmBackward>)
loss:  tensor(14938225., grad_fn=<MseLossBackward>)
output :  tensor([[135422.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(31111644., grad_fn=<MseLossBackward>)
output :  tensor([[120070.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8165e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107775.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2975409.5000, grad_fn=<MseLossBackward>)
output :  tensor([[156834.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4541e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181117.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7624e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172428.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(326058.8438, grad_fn=<MseLossBackward>)
output :  tensor([[195476.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(30504738., grad_fn=<MseLossBackward>)
output :  tensor([[98692.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1710046.6250, grad_fn=<MseLossBackward>)
output :  tensor([[175405.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(12918858., grad_fn=<MseLossBackward>)
output :  tensor([[169474.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2479444., grad_fn=<MseLossBackward>)
output :  tensor([[141653.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(7040979.5000, grad_fn=<MseLossBackward>)
output :  tensor([[264641.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9225e+09, grad_fn=<MseLossBackward>)
output :  tensor([[140790.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1126e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173913.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(835338.8750, grad_fn=<MseLossBackward>)
output :  tensor([[145009.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(25096342., grad_fn=<MseLossBackward>)
output :  tensor([[201915.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2004790.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169973.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(694.8167, grad_fn=<MseLossBackward>)
output :  tensor([[243680.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(101960.4688, grad_fn=<MseLossBackward>)
output :  tensor([[133527.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(945969., grad_fn=<MseLossBackward>)
output :  tensor([[149607.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(66338.4375, grad_fn=<MseLossBackward>)
output :  tensor([[214513.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(236347.9062, grad_fn=<MseLossBackward>)
output :  tensor([[167466.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6083005.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194428.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(29473532., grad_fn=<MseLossBackward>)
output :  tensor([[132221.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1707e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132803.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(14463997., grad_fn=<MseLossBackward>)
output :  tensor([[138996.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1006980.8750, grad_fn=<MseLossBackward>)
output :  tensor([[204336.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2462e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166017.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6028e+09, grad_fn=<MseLossBackward>)
output :  tensor([[74422.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0800e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92575.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(65208276., grad_fn=<MseLossBackward>)
output :  tensor([[249871.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(11703455., grad_fn=<MseLossBackward>)
output :  tensor([[203677.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1832e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116570.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(2465219., grad_fn=<MseLossBackward>)
output :  tensor([[157588.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9468e+08, grad_fn=<MseLossBackward>)
output :  tensor([[210798.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(84670480., grad_fn=<MseLossBackward>)
output :  tensor([[182135.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7201e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157915.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8500596., grad_fn=<MseLossBackward>)
output :  tensor([[169228.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(595839.2500, grad_fn=<MseLossBackward>)
output :  tensor([[116626.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(2644104.7500, grad_fn=<MseLossBackward>)
output :  tensor([[160452.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(29725496., grad_fn=<MseLossBackward>)
output :  tensor([[192686.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0201e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223562.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(16501494., grad_fn=<MseLossBackward>)
output :  tensor([[247871.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4714e+11, grad_fn=<MseLossBackward>)
output :  tensor([[148246.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1552710.7500, grad_fn=<MseLossBackward>)
output :  tensor([[109913.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(2054765.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170973.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1939e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148236.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5122583.5000, grad_fn=<MseLossBackward>)
output :  tensor([[231690.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(28186476., grad_fn=<MseLossBackward>)
output :  tensor([[119365.]], grad_fn=<AddmmBackward>)
loss:  tensor(19053224., grad_fn=<MseLossBackward>)
output :  tensor([[184755.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3441778.7500, grad_fn=<MseLossBackward>)
output :  tensor([[184783.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3671475.2500, grad_fn=<MseLossBackward>)
output :  tensor([[161605.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5089e+10, grad_fn=<MseLossBackward>)
output :  tensor([[95482.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0974e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244993.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(35926724., grad_fn=<MseLossBackward>)
output :  tensor([[176666.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(444368.0625, grad_fn=<MseLossBackward>)
output :  tensor([[138087.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3659270., grad_fn=<MseLossBackward>)
output :  tensor([[234474.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(275690.6250, grad_fn=<MseLossBackward>)
output :  tensor([[161378.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2628299.5000, grad_fn=<MseLossBackward>)
output :  tensor([[205526.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4274e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135716.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(513596.1875, grad_fn=<MseLossBackward>)
output :  tensor([[186442.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9744e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136875.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(766117.2500, grad_fn=<MseLossBackward>)
output :  tensor([[227149.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(78333008., grad_fn=<MseLossBackward>)
output :  tensor([[228626.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5683e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92344.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5496314., grad_fn=<MseLossBackward>)
output :  tensor([[162795.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(11299577., grad_fn=<MseLossBackward>)
output :  tensor([[248112.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5071e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144583.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(173797.7969, grad_fn=<MseLossBackward>)
output :  tensor([[112160.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0395e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163889.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(372996.4688, grad_fn=<MseLossBackward>)
output :  tensor([[148545.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(20659866., grad_fn=<MseLossBackward>)
output :  tensor([[127944.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(65488.0078, grad_fn=<MseLossBackward>)
output :  tensor([[187786.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0714e+09, grad_fn=<MseLossBackward>)
output :  tensor([[125169.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7127648.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154474.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6122145., grad_fn=<MseLossBackward>)
output :  tensor([[171561.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(35579.3906, grad_fn=<MseLossBackward>)
output :  tensor([[148683.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5366027.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160569.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5432687., grad_fn=<MseLossBackward>)
output :  tensor([[135269.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9008e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133152.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1328472.3750, grad_fn=<MseLossBackward>)
output :  tensor([[153928.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2285e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146364.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4896055., grad_fn=<MseLossBackward>)
output :  tensor([[163299.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2401725., grad_fn=<MseLossBackward>)
output :  tensor([[140082.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1099e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147933.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(750605.6250, grad_fn=<MseLossBackward>)
output :  tensor([[189591.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2532524., grad_fn=<MseLossBackward>)
output :  tensor([[171673.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7148855.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179437.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(316089.9375, grad_fn=<MseLossBackward>)
output :  tensor([[222106.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4437342., grad_fn=<MseLossBackward>)
output :  tensor([[111415.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(12356323., grad_fn=<MseLossBackward>)
output :  tensor([[135671.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1602e+08, grad_fn=<MseLossBackward>)
output :  tensor([[282398.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(12970802., grad_fn=<MseLossBackward>)
output :  tensor([[119632.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(13197667., grad_fn=<MseLossBackward>)
output :  tensor([[179831.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6135e+09, grad_fn=<MseLossBackward>)
output :  tensor([[188367.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(11341424., grad_fn=<MseLossBackward>)
output :  tensor([[190732.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(27381018., grad_fn=<MseLossBackward>)
output :  tensor([[251293.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6201e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220396.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2570009.7500, grad_fn=<MseLossBackward>)
output :  tensor([[124463.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4461e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174099.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4519e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126843.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(8083049., grad_fn=<MseLossBackward>)
output :  tensor([[183846.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4991e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149838.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9998046., grad_fn=<MseLossBackward>)
output :  tensor([[154577.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(65250804., grad_fn=<MseLossBackward>)
output :  tensor([[201816.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(20099110., grad_fn=<MseLossBackward>)
output :  tensor([[145436.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6736e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174450.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2401434.5000, grad_fn=<MseLossBackward>)
output :  tensor([[252816.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1200e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149320.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1744215.5000, grad_fn=<MseLossBackward>)
output :  tensor([[201423.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1540856.7500, grad_fn=<MseLossBackward>)
output :  tensor([[160742.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(627957.1875, grad_fn=<MseLossBackward>)
output :  tensor([[119739.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0074e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139443.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(13641827., grad_fn=<MseLossBackward>)
output :  tensor([[182043.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3828503.7500, grad_fn=<MseLossBackward>)
output :  tensor([[196711.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(45044232., grad_fn=<MseLossBackward>)
output :  tensor([[239892.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4116e+09, grad_fn=<MseLossBackward>)
output :  tensor([[254293.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7327595., grad_fn=<MseLossBackward>)
output :  tensor([[190737.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6451e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142667.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6181e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141682.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7940772., grad_fn=<MseLossBackward>)
output :  tensor([[71093.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6680e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128456.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(42815552., grad_fn=<MseLossBackward>)
output :  tensor([[131817.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8512536., grad_fn=<MseLossBackward>)
output :  tensor([[157608.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(13018566., grad_fn=<MseLossBackward>)
output :  tensor([[126073.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(857910.1250, grad_fn=<MseLossBackward>)
output :  tensor([[79374.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(8263379., grad_fn=<MseLossBackward>)
output :  tensor([[86062.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(16504351., grad_fn=<MseLossBackward>)
output :  tensor([[239164.]], grad_fn=<AddmmBackward>)
loss:  tensor(51322896., grad_fn=<MseLossBackward>)
output :  tensor([[140769.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9914e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133318.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(7941916.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166933.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4428.4863, grad_fn=<MseLossBackward>)
output :  tensor([[234654.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(119510.6484, grad_fn=<MseLossBackward>)
output :  tensor([[193307.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1363859., grad_fn=<MseLossBackward>)
output :  tensor([[157400.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1962013., grad_fn=<MseLossBackward>)
output :  tensor([[199834.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3743559.7500, grad_fn=<MseLossBackward>)
output :  tensor([[205078.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0190e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139153.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4637226., grad_fn=<MseLossBackward>)
output :  tensor([[154425.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(329745.1250, grad_fn=<MseLossBackward>)
output :  tensor([[136563.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(317356.1875, grad_fn=<MseLossBackward>)
output :  tensor([[201442.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1555e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155595.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2544573.2500, grad_fn=<MseLossBackward>)
output :  tensor([[137502.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9362e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146307.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1980616.3750, grad_fn=<MseLossBackward>)
output :  tensor([[210460.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2370733.7500, grad_fn=<MseLossBackward>)
output :  tensor([[99893.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2019e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168985.]], grad_fn=<AddmmBackward>)
loss:  tensor(2205225., grad_fn=<MseLossBackward>)
output :  tensor([[127329.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(449015.1562, grad_fn=<MseLossBackward>)
output :  tensor([[146006.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(987663.3125, grad_fn=<MseLossBackward>)
output :  tensor([[106387.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9364e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136658.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(707543.8125, grad_fn=<MseLossBackward>)
output :  tensor([[239037.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9227925., grad_fn=<MseLossBackward>)
output :  tensor([[144864.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(18432.3047, grad_fn=<MseLossBackward>)
output :  tensor([[139624.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4515226.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164418.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3263e+09, grad_fn=<MseLossBackward>)
output :  tensor([[272529.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(29926712., grad_fn=<MseLossBackward>)
output :  tensor([[179243.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(18007160., grad_fn=<MseLossBackward>)
output :  tensor([[104353.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(2487150.7500, grad_fn=<MseLossBackward>)
output :  tensor([[204810.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2838e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160408.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1985237., grad_fn=<MseLossBackward>)
output :  tensor([[162653.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6127e+10, grad_fn=<MseLossBackward>)
output :  tensor([[101011.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7354605., grad_fn=<MseLossBackward>)
output :  tensor([[125148.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2398917., grad_fn=<MseLossBackward>)
output :  tensor([[157126.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1269495.1250, grad_fn=<MseLossBackward>)
output :  tensor([[140355.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(126680.3828, grad_fn=<MseLossBackward>)
output :  tensor([[201262.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1593551.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145244.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(10524448., grad_fn=<MseLossBackward>)
output :  tensor([[264948.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7118724.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127298.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1764e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166769.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1610916.2500, grad_fn=<MseLossBackward>)
output :  tensor([[186666.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3361894.2500, grad_fn=<MseLossBackward>)
output :  tensor([[124861.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2087e+08, grad_fn=<MseLossBackward>)
output :  tensor([[254511.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(20356876., grad_fn=<MseLossBackward>)
output :  tensor([[158222.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2813e+08, grad_fn=<MseLossBackward>)
output :  tensor([[242455.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8375778.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143455.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(296633.4062, grad_fn=<MseLossBackward>)
output :  tensor([[211727.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2985822., grad_fn=<MseLossBackward>)
output :  tensor([[174612.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4895363.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153934.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4341.5742, grad_fn=<MseLossBackward>)
output :  tensor([[121991.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(15928455., grad_fn=<MseLossBackward>)
output :  tensor([[235829.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6276e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236922.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(9473795., grad_fn=<MseLossBackward>)
output :  tensor([[152620.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(513461.8125, grad_fn=<MseLossBackward>)
output :  tensor([[255376.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(226799.1875, grad_fn=<MseLossBackward>)
output :  tensor([[124921.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0853e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176031.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1006.0791, grad_fn=<MseLossBackward>)
output :  tensor([[162042.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4171997.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135070.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(16572787., grad_fn=<MseLossBackward>)
output :  tensor([[193319.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0730e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163972.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(767.4631, grad_fn=<MseLossBackward>)
output :  tensor([[164668.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2785404.5000, grad_fn=<MseLossBackward>)
output :  tensor([[156028.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3885025.7500, grad_fn=<MseLossBackward>)
output :  tensor([[154943.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(25433424., grad_fn=<MseLossBackward>)
output :  tensor([[173224.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0608e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159275.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(525307.8750, grad_fn=<MseLossBackward>)
output :  tensor([[378476.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(30179228., grad_fn=<MseLossBackward>)
output :  tensor([[138016.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2137e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129208.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9104e+09, grad_fn=<MseLossBackward>)
output :  tensor([[282098.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(784774.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163709.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2921268.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130198.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(94059688., grad_fn=<MseLossBackward>)
output :  tensor([[240799.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(77425152., grad_fn=<MseLossBackward>)
output :  tensor([[179057.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2080310.3750, grad_fn=<MseLossBackward>)
output :  tensor([[153721.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2963347., grad_fn=<MseLossBackward>)
output :  tensor([[144312.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(472613.2812, grad_fn=<MseLossBackward>)
output :  tensor([[153563.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7766e+08, grad_fn=<MseLossBackward>)
output :  tensor([[101661.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2761880.5000, grad_fn=<MseLossBackward>)
output :  tensor([[71665.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3608e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167293.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5259282., grad_fn=<MseLossBackward>)
output :  tensor([[188100.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5920e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159021.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1042983.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161831.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(18759862., grad_fn=<MseLossBackward>)
output :  tensor([[139501.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4207049.5000, grad_fn=<MseLossBackward>)
output :  tensor([[204251.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2885273.7500, grad_fn=<MseLossBackward>)
output :  tensor([[139579.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2494869.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183190.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6081e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145491.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(259017.3750, grad_fn=<MseLossBackward>)
output :  tensor([[108774.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6433e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94794.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(630870.3125, grad_fn=<MseLossBackward>)
output :  tensor([[175381.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(145220.5312, grad_fn=<MseLossBackward>)
output :  tensor([[258480.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3683280.7500, grad_fn=<MseLossBackward>)
output :  tensor([[140515.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(968379., grad_fn=<MseLossBackward>)
output :  tensor([[159399.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(245071.4062, grad_fn=<MseLossBackward>)
output :  tensor([[133742.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1543262.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147570.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3721885., grad_fn=<MseLossBackward>)
output :  tensor([[168857.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(916866.1250, grad_fn=<MseLossBackward>)
output :  tensor([[129700.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(7290675., grad_fn=<MseLossBackward>)
output :  tensor([[170280.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3911e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155623.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1894580.2500, grad_fn=<MseLossBackward>)
output :  tensor([[116458.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1714.4775, grad_fn=<MseLossBackward>)
output :  tensor([[159883.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3460e+09, grad_fn=<MseLossBackward>)
output :  tensor([[55663.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(13424610., grad_fn=<MseLossBackward>)
output :  tensor([[231427.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5728e+09, grad_fn=<MseLossBackward>)
output :  tensor([[199921.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1162656.7500, grad_fn=<MseLossBackward>)
output :  tensor([[184211.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(621485.8750, grad_fn=<MseLossBackward>)
output :  tensor([[105226.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(598133.0625, grad_fn=<MseLossBackward>)
output :  tensor([[87657.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(431679.8125, grad_fn=<MseLossBackward>)
output :  tensor([[146235.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(38877952., grad_fn=<MseLossBackward>)
output :  tensor([[222827.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0655e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205987.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2288270.7500, grad_fn=<MseLossBackward>)
output :  tensor([[159969.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(25303100., grad_fn=<MseLossBackward>)
output :  tensor([[173977.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2850e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190410.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(168394.8125, grad_fn=<MseLossBackward>)
output :  tensor([[91675.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(21862492., grad_fn=<MseLossBackward>)
output :  tensor([[140187.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(35115.2461, grad_fn=<MseLossBackward>)
output :  tensor([[112707.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4872849.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145906.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(98933176., grad_fn=<MseLossBackward>)
output :  tensor([[171986.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6799e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194313.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1420e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177548.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(6011078., grad_fn=<MseLossBackward>)
output :  tensor([[98646.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4609139.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117450.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2411.7307, grad_fn=<MseLossBackward>)
output :  tensor([[161316.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1453e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199748.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(63008.8438, grad_fn=<MseLossBackward>)
output :  tensor([[144994.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(988470.9375, grad_fn=<MseLossBackward>)
train_loss: [2.5639122e+09]
epoch_result tensor([0.])
output :  tensor([[156591.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3642133.7500, grad_fn=<MseLossBackward>)
output :  tensor([[121054.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(893054.5625, grad_fn=<MseLossBackward>)
output :  tensor([[194674.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(223847.2656, grad_fn=<MseLossBackward>)
output :  tensor([[178008.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1017355.9375, grad_fn=<MseLossBackward>)
output :  tensor([[153099.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2003e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124275.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(13873763., grad_fn=<MseLossBackward>)
output :  tensor([[141699.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(489278.4062, grad_fn=<MseLossBackward>)
output :  tensor([[117148.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3428978., grad_fn=<MseLossBackward>)
output :  tensor([[63999.6680]], grad_fn=<AddmmBackward>)
loss:  tensor(30246348., grad_fn=<MseLossBackward>)
output :  tensor([[165388.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(373607.4688, grad_fn=<MseLossBackward>)
output :  tensor([[142007.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4029554.5000, grad_fn=<MseLossBackward>)
output :  tensor([[227102.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4422280.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165247.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(14079966., grad_fn=<MseLossBackward>)
output :  tensor([[246882.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(7940331.5000, grad_fn=<MseLossBackward>)
output :  tensor([[58090.4414]], grad_fn=<AddmmBackward>)
loss:  tensor(9550828., grad_fn=<MseLossBackward>)
output :  tensor([[161458.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8758e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172477.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6363242.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162465.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(35592784., grad_fn=<MseLossBackward>)
output :  tensor([[276735.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3011851.7500, grad_fn=<MseLossBackward>)
output :  tensor([[198276.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1629611.8750, grad_fn=<MseLossBackward>)
output :  tensor([[138755.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4936e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194219.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(115748.7969, grad_fn=<MseLossBackward>)
output :  tensor([[179071.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1002e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151779.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(607961.3125, grad_fn=<MseLossBackward>)
output :  tensor([[167164.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(8038554., grad_fn=<MseLossBackward>)
output :  tensor([[86351.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(905991.6250, grad_fn=<MseLossBackward>)
output :  tensor([[170490.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3051e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183090.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3647503.2500, grad_fn=<MseLossBackward>)
output :  tensor([[208058.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2507e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110629.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(395827.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169444.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2419094.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134662.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3375487.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128524.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(225706.6406, grad_fn=<MseLossBackward>)
output :  tensor([[119588.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(7865.4727, grad_fn=<MseLossBackward>)
output :  tensor([[146876.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9259e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167398.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1786e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149969.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(72411.4453, grad_fn=<MseLossBackward>)
output :  tensor([[180385.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(148887.4531, grad_fn=<MseLossBackward>)
output :  tensor([[142293.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1672051., grad_fn=<MseLossBackward>)
output :  tensor([[106699.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7887e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136582.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1494e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135002.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7354, grad_fn=<MseLossBackward>)
output :  tensor([[132860.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(34342164., grad_fn=<MseLossBackward>)
output :  tensor([[225954.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(910443.9375, grad_fn=<MseLossBackward>)
output :  tensor([[132408.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(25077.6914, grad_fn=<MseLossBackward>)
output :  tensor([[151531.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6407701., grad_fn=<MseLossBackward>)
output :  tensor([[112631.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(399167.2812, grad_fn=<MseLossBackward>)
output :  tensor([[160102.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(10471.0449, grad_fn=<MseLossBackward>)
output :  tensor([[146408.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3611e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192092.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(8562.0322, grad_fn=<MseLossBackward>)
output :  tensor([[135379.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(863447.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117494.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(56165424., grad_fn=<MseLossBackward>)
output :  tensor([[234597.]], grad_fn=<AddmmBackward>)
loss:  tensor(356409., grad_fn=<MseLossBackward>)
output :  tensor([[167082.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1537e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153363.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(31766610., grad_fn=<MseLossBackward>)
output :  tensor([[203959.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8406e+10, grad_fn=<MseLossBackward>)
output :  tensor([[244013.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2097e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142647.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(725983.8750, grad_fn=<MseLossBackward>)
output :  tensor([[133750.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(62382.8672, grad_fn=<MseLossBackward>)
output :  tensor([[156691.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2861595.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132258.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5101951.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179343.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5054e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182422.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2812853., grad_fn=<MseLossBackward>)
output :  tensor([[164262.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7629852.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146434.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(11796542., grad_fn=<MseLossBackward>)
output :  tensor([[143085.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(342572.4375, grad_fn=<MseLossBackward>)
output :  tensor([[143943.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1115829.1250, grad_fn=<MseLossBackward>)
output :  tensor([[174230.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2845e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194250.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1755e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138509.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4038153., grad_fn=<MseLossBackward>)
output :  tensor([[168076.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(14619869., grad_fn=<MseLossBackward>)
output :  tensor([[176702.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(18468104., grad_fn=<MseLossBackward>)
output :  tensor([[118796.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(14414480., grad_fn=<MseLossBackward>)
output :  tensor([[217744.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(10600824., grad_fn=<MseLossBackward>)
output :  tensor([[186147.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7007684.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128729.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(10429468., grad_fn=<MseLossBackward>)
output :  tensor([[193795.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(7316602.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176735.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3368716., grad_fn=<MseLossBackward>)
output :  tensor([[211044.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0697e+10, grad_fn=<MseLossBackward>)
output :  tensor([[207171.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(14660643., grad_fn=<MseLossBackward>)
output :  tensor([[165114.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1638e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192432.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4276107., grad_fn=<MseLossBackward>)
output :  tensor([[112498.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(251337.7188, grad_fn=<MseLossBackward>)
output :  tensor([[115146.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7005368.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110817.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(1397438., grad_fn=<MseLossBackward>)
output :  tensor([[146223.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(331992.0312, grad_fn=<MseLossBackward>)
output :  tensor([[157863.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4144e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178978.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1042951.5625, grad_fn=<MseLossBackward>)
output :  tensor([[127285.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(45886.3242, grad_fn=<MseLossBackward>)
output :  tensor([[144743.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(65904.5156, grad_fn=<MseLossBackward>)
output :  tensor([[180716.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0991e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116599.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(90084.3984, grad_fn=<MseLossBackward>)
output :  tensor([[197333.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(111326.4922, grad_fn=<MseLossBackward>)
output :  tensor([[141848.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9934907., grad_fn=<MseLossBackward>)
output :  tensor([[209823.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(9462641., grad_fn=<MseLossBackward>)
output :  tensor([[128243.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5032451., grad_fn=<MseLossBackward>)
output :  tensor([[240908.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(55042488., grad_fn=<MseLossBackward>)
output :  tensor([[241026.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9337e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144143.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6240e+08, grad_fn=<MseLossBackward>)
output :  tensor([[84569.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5554e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196565.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1362e+09, grad_fn=<MseLossBackward>)
output :  tensor([[82188.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(1411511.1250, grad_fn=<MseLossBackward>)
output :  tensor([[140081.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(338560.3438, grad_fn=<MseLossBackward>)
output :  tensor([[76201.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(491642., grad_fn=<MseLossBackward>)
output :  tensor([[142018.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(873816., grad_fn=<MseLossBackward>)
output :  tensor([[174153.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3409620., grad_fn=<MseLossBackward>)
output :  tensor([[152577.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(850573.8750, grad_fn=<MseLossBackward>)
output :  tensor([[109642.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(5030453., grad_fn=<MseLossBackward>)
output :  tensor([[205824.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2084e+10, grad_fn=<MseLossBackward>)
output :  tensor([[130382.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(3544835.7500, grad_fn=<MseLossBackward>)
output :  tensor([[268920.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2276e+08, grad_fn=<MseLossBackward>)
output :  tensor([[310790.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(624346.8750, grad_fn=<MseLossBackward>)
output :  tensor([[111420.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(15367074., grad_fn=<MseLossBackward>)
output :  tensor([[170463.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4145805., grad_fn=<MseLossBackward>)
output :  tensor([[133504.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5048e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148281.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(86141312., grad_fn=<MseLossBackward>)
output :  tensor([[128519.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2995549.7500, grad_fn=<MseLossBackward>)
output :  tensor([[127743.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(7527306.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133990.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9976e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226992.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8419e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190970.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2509e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141575.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5405189., grad_fn=<MseLossBackward>)
output :  tensor([[128339.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(704642.1875, grad_fn=<MseLossBackward>)
output :  tensor([[112839.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2525616.2500, grad_fn=<MseLossBackward>)
output :  tensor([[256757.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7581e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134202.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(636180.6875, grad_fn=<MseLossBackward>)
output :  tensor([[204098.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1207423.2500, grad_fn=<MseLossBackward>)
output :  tensor([[101449.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(11903147., grad_fn=<MseLossBackward>)
output :  tensor([[140803.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(728648.9375, grad_fn=<MseLossBackward>)
output :  tensor([[211469.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6979e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177001.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(8403386., grad_fn=<MseLossBackward>)
output :  tensor([[187725.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7430735.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165010.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0733e+10, grad_fn=<MseLossBackward>)
output :  tensor([[304133.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5273e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199587.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2846074.5000, grad_fn=<MseLossBackward>)
output :  tensor([[259850.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0452e+10, grad_fn=<MseLossBackward>)
output :  tensor([[227504.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4819e+09, grad_fn=<MseLossBackward>)
output :  tensor([[286044.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5825e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225171.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1373364.2500, grad_fn=<MseLossBackward>)
output :  tensor([[222096.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8867e+10, grad_fn=<MseLossBackward>)
output :  tensor([[197895.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(802144.1250, grad_fn=<MseLossBackward>)
output :  tensor([[158174.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5116e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134769.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(5151126.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134797.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(493769.7188, grad_fn=<MseLossBackward>)
output :  tensor([[91672.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(452760.7500, grad_fn=<MseLossBackward>)
output :  tensor([[111142.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(9872311., grad_fn=<MseLossBackward>)
output :  tensor([[271792.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2613e+09, grad_fn=<MseLossBackward>)
output :  tensor([[230987.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(16103918., grad_fn=<MseLossBackward>)
output :  tensor([[144066.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(871830.6875, grad_fn=<MseLossBackward>)
output :  tensor([[135333.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4693857.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175779.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4189057.7500, grad_fn=<MseLossBackward>)
output :  tensor([[143360.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3571686.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165858.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2031e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165249.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(62242.4531, grad_fn=<MseLossBackward>)
output :  tensor([[140806.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(14490394., grad_fn=<MseLossBackward>)
output :  tensor([[188827.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3994e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113783.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(3181680.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169591.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5798840.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117923.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4310425., grad_fn=<MseLossBackward>)
output :  tensor([[86105.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(800871.1875, grad_fn=<MseLossBackward>)
output :  tensor([[178541.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2125809.5000, grad_fn=<MseLossBackward>)
output :  tensor([[112625.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7428776., grad_fn=<MseLossBackward>)
output :  tensor([[242154.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(9952842., grad_fn=<MseLossBackward>)
output :  tensor([[248885.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(15095532., grad_fn=<MseLossBackward>)
output :  tensor([[127721.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3164174., grad_fn=<MseLossBackward>)
output :  tensor([[115000.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(36495096., grad_fn=<MseLossBackward>)
output :  tensor([[289931.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1674e+10, grad_fn=<MseLossBackward>)
output :  tensor([[175520.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(16167938., grad_fn=<MseLossBackward>)
output :  tensor([[123107.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3580728.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144205.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8671e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203522.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0977e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140979.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(405.6448, grad_fn=<MseLossBackward>)
output :  tensor([[160034.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4392e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153786.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(12924.8477, grad_fn=<MseLossBackward>)
output :  tensor([[128394.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(1222907.6250, grad_fn=<MseLossBackward>)
output :  tensor([[252627.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5844e+10, grad_fn=<MseLossBackward>)
output :  tensor([[400411.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2524126.5000, grad_fn=<MseLossBackward>)
output :  tensor([[106708.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(5250578.5000, grad_fn=<MseLossBackward>)
output :  tensor([[119760.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(1589234.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157443.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4229321., grad_fn=<MseLossBackward>)
output :  tensor([[130181.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6733e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163073.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4723e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174268.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1304e+09, grad_fn=<MseLossBackward>)
output :  tensor([[104736.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(1291898.6250, grad_fn=<MseLossBackward>)
output :  tensor([[140481.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(269150.1875, grad_fn=<MseLossBackward>)
output :  tensor([[365370.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3698770.2500, grad_fn=<MseLossBackward>)
output :  tensor([[206510.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2552e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176601.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1213336.6250, grad_fn=<MseLossBackward>)
output :  tensor([[202528.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(137722.1719, grad_fn=<MseLossBackward>)
output :  tensor([[139648.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(420207.8125, grad_fn=<MseLossBackward>)
output :  tensor([[192107.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5723832., grad_fn=<MseLossBackward>)
output :  tensor([[135972.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1066e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175549.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(29703010., grad_fn=<MseLossBackward>)
output :  tensor([[241865.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(18132.3047, grad_fn=<MseLossBackward>)
output :  tensor([[174156.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(24443.3672, grad_fn=<MseLossBackward>)
output :  tensor([[109747.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(3055476.7500, grad_fn=<MseLossBackward>)
output :  tensor([[265386.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(681914.6875, grad_fn=<MseLossBackward>)
output :  tensor([[243222.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(45930060., grad_fn=<MseLossBackward>)
output :  tensor([[126082.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(9504552., grad_fn=<MseLossBackward>)
output :  tensor([[217018.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3618e+09, grad_fn=<MseLossBackward>)
output :  tensor([[304530.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3136e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206833.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(27821.1973, grad_fn=<MseLossBackward>)
output :  tensor([[214943.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5639e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159803.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3624145., grad_fn=<MseLossBackward>)
output :  tensor([[172233.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5031189., grad_fn=<MseLossBackward>)
output :  tensor([[162580.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(31909966., grad_fn=<MseLossBackward>)
output :  tensor([[168093.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3634444.2500, grad_fn=<MseLossBackward>)
output :  tensor([[238379.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7739e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224010.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(29652280., grad_fn=<MseLossBackward>)
output :  tensor([[159811.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6412e+08, grad_fn=<MseLossBackward>)
output :  tensor([[120999.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4001187.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178498.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2244050.7500, grad_fn=<MseLossBackward>)
output :  tensor([[182141.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0620e+09, grad_fn=<MseLossBackward>)
output :  tensor([[210880.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3759e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135463.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1063960., grad_fn=<MseLossBackward>)
output :  tensor([[147536.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7271e+08, grad_fn=<MseLossBackward>)
output :  tensor([[274709.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5244959., grad_fn=<MseLossBackward>)
output :  tensor([[88735.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(13956178., grad_fn=<MseLossBackward>)
output :  tensor([[235128.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1882341.1250, grad_fn=<MseLossBackward>)
output :  tensor([[258610.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0519e+11, grad_fn=<MseLossBackward>)
output :  tensor([[170140.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(19872.1875, grad_fn=<MseLossBackward>)
output :  tensor([[195417.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5668e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156034.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1070642.8750, grad_fn=<MseLossBackward>)
output :  tensor([[206827.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9908e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129215.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(46302.2969, grad_fn=<MseLossBackward>)
output :  tensor([[146449.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2102364., grad_fn=<MseLossBackward>)
output :  tensor([[169205.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1316e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187519.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2786708.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127977.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3910753.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138631.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4541227.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168785.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(17760562., grad_fn=<MseLossBackward>)
output :  tensor([[197945.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7097e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236698.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(39710476., grad_fn=<MseLossBackward>)
output :  tensor([[152543.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(6035697.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198569.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6603374., grad_fn=<MseLossBackward>)
output :  tensor([[160771.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8128e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178505.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(989465.3750, grad_fn=<MseLossBackward>)
output :  tensor([[179462.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(191269.5625, grad_fn=<MseLossBackward>)
output :  tensor([[100268.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(10684063., grad_fn=<MseLossBackward>)
output :  tensor([[172720.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1509e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135076.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5830.7539, grad_fn=<MseLossBackward>)
output :  tensor([[119346.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(18892402., grad_fn=<MseLossBackward>)
output :  tensor([[174803.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(644934.5000, grad_fn=<MseLossBackward>)
output :  tensor([[87572.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(6619525., grad_fn=<MseLossBackward>)
output :  tensor([[292302.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5301650., grad_fn=<MseLossBackward>)
output :  tensor([[169515.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(20392986., grad_fn=<MseLossBackward>)
output :  tensor([[191081.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0189e+10, grad_fn=<MseLossBackward>)
output :  tensor([[246578.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9641e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156248.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(27542652., grad_fn=<MseLossBackward>)
output :  tensor([[123516.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(234248.4375, grad_fn=<MseLossBackward>)
output :  tensor([[122614.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7368934.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142482.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5530e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174607.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(368847.4375, grad_fn=<MseLossBackward>)
output :  tensor([[111002.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1238e+08, grad_fn=<MseLossBackward>)
output :  tensor([[210778.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1496e+10, grad_fn=<MseLossBackward>)
output :  tensor([[247651.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(37846912., grad_fn=<MseLossBackward>)
output :  tensor([[249538.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1215e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222100.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8559e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196143.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4246e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189877.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5653472., grad_fn=<MseLossBackward>)
output :  tensor([[204753.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8451e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189390.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1494e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179971.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1515784.1250, grad_fn=<MseLossBackward>)
output :  tensor([[151896.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(10734.9023, grad_fn=<MseLossBackward>)
output :  tensor([[333231.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(14204183., grad_fn=<MseLossBackward>)
output :  tensor([[213577.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2488555.5000, grad_fn=<MseLossBackward>)
output :  tensor([[156140.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(14898514., grad_fn=<MseLossBackward>)
output :  tensor([[189107.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7450e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105957.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(916537., grad_fn=<MseLossBackward>)
output :  tensor([[276270.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7690e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171479.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5860333., grad_fn=<MseLossBackward>)
output :  tensor([[210144.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(11262107., grad_fn=<MseLossBackward>)
output :  tensor([[213634.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(54252200., grad_fn=<MseLossBackward>)
output :  tensor([[177297.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3620873.7500, grad_fn=<MseLossBackward>)
output :  tensor([[204378.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6649548.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155709.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(503257.2188, grad_fn=<MseLossBackward>)
output :  tensor([[146164.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1312e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116260.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(5017530., grad_fn=<MseLossBackward>)
output :  tensor([[137282.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(7386674.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151509.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6296727.5000, grad_fn=<MseLossBackward>)
output :  tensor([[201370.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6035e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160579.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1164780.5000, grad_fn=<MseLossBackward>)
output :  tensor([[100064.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(319039.6250, grad_fn=<MseLossBackward>)
output :  tensor([[221356.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4758e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184334.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5474e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174304.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4756556.5000, grad_fn=<MseLossBackward>)
output :  tensor([[82557.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(310632.0625, grad_fn=<MseLossBackward>)
output :  tensor([[127998.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(251251.5625, grad_fn=<MseLossBackward>)
output :  tensor([[212118.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3540218.7500, grad_fn=<MseLossBackward>)
output :  tensor([[143861.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(19147.6406, grad_fn=<MseLossBackward>)
output :  tensor([[134228.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(17880608., grad_fn=<MseLossBackward>)
output :  tensor([[143131.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(282891., grad_fn=<MseLossBackward>)
output :  tensor([[175905.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4750e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145355.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1837337.8750, grad_fn=<MseLossBackward>)
output :  tensor([[160136.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(18547.0352, grad_fn=<MseLossBackward>)
output :  tensor([[215124.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(15554.7666, grad_fn=<MseLossBackward>)
output :  tensor([[135987.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6020e+08, grad_fn=<MseLossBackward>)
output :  tensor([[250973.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(16208928., grad_fn=<MseLossBackward>)
output :  tensor([[158406.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1196084., grad_fn=<MseLossBackward>)
output :  tensor([[127899.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(360384.4688, grad_fn=<MseLossBackward>)
output :  tensor([[95224.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(50309.0898, grad_fn=<MseLossBackward>)
output :  tensor([[149377.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2090e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179958.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3365.8127, grad_fn=<MseLossBackward>)
output :  tensor([[122637.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4569240., grad_fn=<MseLossBackward>)
output :  tensor([[191610.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3943e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145740.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3878e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151135.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1525456.6250, grad_fn=<MseLossBackward>)
output :  tensor([[188499.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(561914.1875, grad_fn=<MseLossBackward>)
output :  tensor([[252470.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6488e+09, grad_fn=<MseLossBackward>)
output :  tensor([[91929.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(184799.2344, grad_fn=<MseLossBackward>)
output :  tensor([[235059.]], grad_fn=<AddmmBackward>)
loss:  tensor(24413480., grad_fn=<MseLossBackward>)
output :  tensor([[125676.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(7973696.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166004.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9791e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113304.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7701e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175583.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(173628.4688, grad_fn=<MseLossBackward>)
output :  tensor([[162998.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5690e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154695.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8540e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236011.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8932907., grad_fn=<MseLossBackward>)
output :  tensor([[223098.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2181e+09, grad_fn=<MseLossBackward>)
output :  tensor([[126929.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4926.2852, grad_fn=<MseLossBackward>)
output :  tensor([[123712.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(5234157.5000, grad_fn=<MseLossBackward>)
output :  tensor([[223881.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(9722314., grad_fn=<MseLossBackward>)
output :  tensor([[231578.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5861392.5000, grad_fn=<MseLossBackward>)
output :  tensor([[230009.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(10955997., grad_fn=<MseLossBackward>)
output :  tensor([[146387.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2600609.7500, grad_fn=<MseLossBackward>)
output :  tensor([[203504.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(42189692., grad_fn=<MseLossBackward>)
output :  tensor([[129203.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(84698088., grad_fn=<MseLossBackward>)
output :  tensor([[133945.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2088386.2500, grad_fn=<MseLossBackward>)
output :  tensor([[310805.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(17597238., grad_fn=<MseLossBackward>)
output :  tensor([[138729.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5155312., grad_fn=<MseLossBackward>)
output :  tensor([[121679.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9899e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108908.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(349558.0938, grad_fn=<MseLossBackward>)
output :  tensor([[156969.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4119e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180146.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9451e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176030.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9181468., grad_fn=<MseLossBackward>)
output :  tensor([[195339.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(32036308., grad_fn=<MseLossBackward>)
output :  tensor([[106738.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(45400960., grad_fn=<MseLossBackward>)
output :  tensor([[175786.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(10328390., grad_fn=<MseLossBackward>)
output :  tensor([[171713.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(14541948., grad_fn=<MseLossBackward>)
output :  tensor([[139276.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(76227.7578, grad_fn=<MseLossBackward>)
output :  tensor([[262718.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2894e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142311.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2846e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173028.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(805.1406, grad_fn=<MseLossBackward>)
output :  tensor([[138878.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1257096.5000, grad_fn=<MseLossBackward>)
output :  tensor([[194725.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(33339978., grad_fn=<MseLossBackward>)
output :  tensor([[167564.]], grad_fn=<AddmmBackward>)
loss:  tensor(5934096., grad_fn=<MseLossBackward>)
output :  tensor([[240685.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(10985807., grad_fn=<MseLossBackward>)
output :  tensor([[133073.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2034055.3750, grad_fn=<MseLossBackward>)
output :  tensor([[150556.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1455453.7500, grad_fn=<MseLossBackward>)
output :  tensor([[214443.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(309292.4062, grad_fn=<MseLossBackward>)
output :  tensor([[159863.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(26384756., grad_fn=<MseLossBackward>)
output :  tensor([[186037.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8776777., grad_fn=<MseLossBackward>)
output :  tensor([[132026.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2755e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130382.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(1912408.1250, grad_fn=<MseLossBackward>)
output :  tensor([[139717.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(79859.2266, grad_fn=<MseLossBackward>)
output :  tensor([[206237.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0022e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166324.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6342e+09, grad_fn=<MseLossBackward>)
output :  tensor([[74743.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1738e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93244.]], grad_fn=<AddmmBackward>)
loss:  tensor(76457536., grad_fn=<MseLossBackward>)
output :  tensor([[261711.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(70868512., grad_fn=<MseLossBackward>)
output :  tensor([[202239.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9993e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114196.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(645875.9375, grad_fn=<MseLossBackward>)
output :  tensor([[159027.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1070e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209924.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0152e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182035.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7378e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158890.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(15136841., grad_fn=<MseLossBackward>)
output :  tensor([[172174.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4727227., grad_fn=<MseLossBackward>)
output :  tensor([[114102.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(805352., grad_fn=<MseLossBackward>)
output :  tensor([[160663.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(32077534., grad_fn=<MseLossBackward>)
output :  tensor([[194771.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4711e+08, grad_fn=<MseLossBackward>)
output :  tensor([[218723.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(602928., grad_fn=<MseLossBackward>)
output :  tensor([[245792.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4921e+11, grad_fn=<MseLossBackward>)
output :  tensor([[144309.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(7240724., grad_fn=<MseLossBackward>)
output :  tensor([[108768.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(83196.1875, grad_fn=<MseLossBackward>)
output :  tensor([[171587.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0635e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151593.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1194785.6250, grad_fn=<MseLossBackward>)
output :  tensor([[234890.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4449001.5000, grad_fn=<MseLossBackward>)
output :  tensor([[116829.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(3345955.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178313.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(21032972., grad_fn=<MseLossBackward>)
output :  tensor([[185595.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1219747.6250, grad_fn=<MseLossBackward>)
output :  tensor([[163459.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4505e+10, grad_fn=<MseLossBackward>)
output :  tensor([[94742.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8886e+08, grad_fn=<MseLossBackward>)
output :  tensor([[241729.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7449999.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176626.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(393070.2188, grad_fn=<MseLossBackward>)
output :  tensor([[139117.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(779578.6250, grad_fn=<MseLossBackward>)
output :  tensor([[237514.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6320667.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168459.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(29803240., grad_fn=<MseLossBackward>)
output :  tensor([[205058.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4386e+10, grad_fn=<MseLossBackward>)
output :  tensor([[131693.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(10935939., grad_fn=<MseLossBackward>)
output :  tensor([[186514.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0094e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137950.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3802804.7500, grad_fn=<MseLossBackward>)
output :  tensor([[227359.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(74653648., grad_fn=<MseLossBackward>)
output :  tensor([[227765.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9439e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91900.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(3610920.2500, grad_fn=<MseLossBackward>)
output :  tensor([[161428.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3976410., grad_fn=<MseLossBackward>)
output :  tensor([[243834.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6140e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144949.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2542.3655, grad_fn=<MseLossBackward>)
output :  tensor([[109174.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7787e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164001.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(248097.3906, grad_fn=<MseLossBackward>)
output :  tensor([[143074.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(856492.4375, grad_fn=<MseLossBackward>)
output :  tensor([[129572.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1884785.7500, grad_fn=<MseLossBackward>)
output :  tensor([[187274.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1445e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123746.]], grad_fn=<AddmmBackward>)
loss:  tensor(1552516., grad_fn=<MseLossBackward>)
output :  tensor([[153538.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2366357.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170066.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2833488.2500, grad_fn=<MseLossBackward>)
output :  tensor([[152206.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1456132.3750, grad_fn=<MseLossBackward>)
output :  tensor([[160159.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7512567., grad_fn=<MseLossBackward>)
output :  tensor([[136385.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4995e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131664.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(112476.3906, grad_fn=<MseLossBackward>)
output :  tensor([[153536.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1132e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146743.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6715305.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162247.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(247941.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135370.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4873e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148051.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(559550.7500, grad_fn=<MseLossBackward>)
output :  tensor([[183147.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(23544936., grad_fn=<MseLossBackward>)
output :  tensor([[170068.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1140991.1250, grad_fn=<MseLossBackward>)
output :  tensor([[178281.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2952866.2500, grad_fn=<MseLossBackward>)
output :  tensor([[223148.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(9914922., grad_fn=<MseLossBackward>)
output :  tensor([[107539.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(130151.8359, grad_fn=<MseLossBackward>)
output :  tensor([[137107.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4902e+08, grad_fn=<MseLossBackward>)
output :  tensor([[285426.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(328973.9375, grad_fn=<MseLossBackward>)
output :  tensor([[117918.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3681721.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180030.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5976e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183548.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2106716.2500, grad_fn=<MseLossBackward>)
output :  tensor([[187522.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4092213., grad_fn=<MseLossBackward>)
output :  tensor([[250659.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9247e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221462.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(288889.4688, grad_fn=<MseLossBackward>)
output :  tensor([[125256.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7467e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171895.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5703e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125706.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2913582.2500, grad_fn=<MseLossBackward>)
output :  tensor([[182904.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5472e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151657.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1801677., grad_fn=<MseLossBackward>)
output :  tensor([[153738.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(52394300., grad_fn=<MseLossBackward>)
output :  tensor([[203356.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(8666216., grad_fn=<MseLossBackward>)
output :  tensor([[145779.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7636e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176396.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(156976.9219, grad_fn=<MseLossBackward>)
output :  tensor([[252141.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4848e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148490.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(240360.3906, grad_fn=<MseLossBackward>)
output :  tensor([[199656.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(9053423., grad_fn=<MseLossBackward>)
output :  tensor([[158472.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2182267.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121151.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0990e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136286.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(287916.0938, grad_fn=<MseLossBackward>)
output :  tensor([[181806.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4809386., grad_fn=<MseLossBackward>)
output :  tensor([[199138.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(83517896., grad_fn=<MseLossBackward>)
output :  tensor([[239229.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4771e+09, grad_fn=<MseLossBackward>)
output :  tensor([[250720.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(39430944., grad_fn=<MseLossBackward>)
output :  tensor([[188401.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7056e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142844.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6362e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150183.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(32301994., grad_fn=<MseLossBackward>)
output :  tensor([[71101.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6729e+08, grad_fn=<MseLossBackward>)
output :  tensor([[142849.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(61616856., grad_fn=<MseLossBackward>)
output :  tensor([[131007.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4441951.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155875.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3515800.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128651.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2725852.5000, grad_fn=<MseLossBackward>)
output :  tensor([[77786.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1655122.5000, grad_fn=<MseLossBackward>)
output :  tensor([[84217.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4917167.5000, grad_fn=<MseLossBackward>)
output :  tensor([[227657.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(18861106., grad_fn=<MseLossBackward>)
output :  tensor([[140353.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7581e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131860.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1851385.3750, grad_fn=<MseLossBackward>)
output :  tensor([[170702.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(13708506., grad_fn=<MseLossBackward>)
output :  tensor([[237249.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5060109.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191179.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(923250.7500, grad_fn=<MseLossBackward>)
output :  tensor([[158048.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4197248.5000, grad_fn=<MseLossBackward>)
output :  tensor([[199224.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1755459.3750, grad_fn=<MseLossBackward>)
output :  tensor([[207374.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7765e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137361.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(130614.4766, grad_fn=<MseLossBackward>)
output :  tensor([[155137.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(18923.4414, grad_fn=<MseLossBackward>)
output :  tensor([[134895.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1219471.6250, grad_fn=<MseLossBackward>)
output :  tensor([[199920.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0478e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154403.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(162913.1406, grad_fn=<MseLossBackward>)
output :  tensor([[136598.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8574e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145038.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(19234.2227, grad_fn=<MseLossBackward>)
output :  tensor([[207657.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(18854592., grad_fn=<MseLossBackward>)
output :  tensor([[101467.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7897e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168503.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1007294.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126296.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2901965.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145760.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1536592.6250, grad_fn=<MseLossBackward>)
output :  tensor([[105017.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8177e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139253.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3075036.2500, grad_fn=<MseLossBackward>)
output :  tensor([[235616.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(147180.1250, grad_fn=<MseLossBackward>)
output :  tensor([[144631.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(135999.6094, grad_fn=<MseLossBackward>)
output :  tensor([[137593.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8710.1387, grad_fn=<MseLossBackward>)
output :  tensor([[162998.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2249e+09, grad_fn=<MseLossBackward>)
output :  tensor([[270596.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(54806724., grad_fn=<MseLossBackward>)
output :  tensor([[175639.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(409400.0312, grad_fn=<MseLossBackward>)
output :  tensor([[105458.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(7198447., grad_fn=<MseLossBackward>)
output :  tensor([[200987.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8541e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159504.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(254488.7188, grad_fn=<MseLossBackward>)
output :  tensor([[162448.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6215e+10, grad_fn=<MseLossBackward>)
output :  tensor([[99010.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(505010.0938, grad_fn=<MseLossBackward>)
output :  tensor([[120579.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(9123279., grad_fn=<MseLossBackward>)
output :  tensor([[156208.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(43589.6094, grad_fn=<MseLossBackward>)
output :  tensor([[140994.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(988905.9375, grad_fn=<MseLossBackward>)
output :  tensor([[198812.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1410267.6250, grad_fn=<MseLossBackward>)
output :  tensor([[142747.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(558569.3750, grad_fn=<MseLossBackward>)
output :  tensor([[257805.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(20019192., grad_fn=<MseLossBackward>)
output :  tensor([[125149.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0336e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165259.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(57817.7070, grad_fn=<MseLossBackward>)
output :  tensor([[186148.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5527715.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121910.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4186e+08, grad_fn=<MseLossBackward>)
output :  tensor([[252564.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6578664., grad_fn=<MseLossBackward>)
output :  tensor([[158267.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2555e+08, grad_fn=<MseLossBackward>)
output :  tensor([[241996.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(11243447., grad_fn=<MseLossBackward>)
output :  tensor([[142587.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1994450., grad_fn=<MseLossBackward>)
output :  tensor([[208743.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1578674.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175995.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(12925598., grad_fn=<MseLossBackward>)
output :  tensor([[154333.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(111357.7734, grad_fn=<MseLossBackward>)
output :  tensor([[124363.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(40497512., grad_fn=<MseLossBackward>)
output :  tensor([[238320.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3785e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236804.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(10213417., grad_fn=<MseLossBackward>)
output :  tensor([[151972.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1863182.3750, grad_fn=<MseLossBackward>)
output :  tensor([[253442.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2123668.7500, grad_fn=<MseLossBackward>)
output :  tensor([[125348.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1760e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175133.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(750280.8125, grad_fn=<MseLossBackward>)
output :  tensor([[157926.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4299143., grad_fn=<MseLossBackward>)
output :  tensor([[132386.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1921775.7500, grad_fn=<MseLossBackward>)
output :  tensor([[190832.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7617e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164909.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(827161.8125, grad_fn=<MseLossBackward>)
output :  tensor([[162049.]], grad_fn=<AddmmBackward>)
loss:  tensor(904401., grad_fn=<MseLossBackward>)
output :  tensor([[157213.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(618951., grad_fn=<MseLossBackward>)
output :  tensor([[146606.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(10847039., grad_fn=<MseLossBackward>)
output :  tensor([[171384.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8297e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160786.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(619024.7500, grad_fn=<MseLossBackward>)
output :  tensor([[380574.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(11526662., grad_fn=<MseLossBackward>)
output :  tensor([[124624.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(5645264.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130745.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0471e+09, grad_fn=<MseLossBackward>)
output :  tensor([[276233.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(24791996., grad_fn=<MseLossBackward>)
output :  tensor([[162531.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(282126.9688, grad_fn=<MseLossBackward>)
output :  tensor([[131556.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2225e+08, grad_fn=<MseLossBackward>)
output :  tensor([[228742.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(10612121., grad_fn=<MseLossBackward>)
output :  tensor([[183033.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6418939., grad_fn=<MseLossBackward>)
output :  tensor([[152258.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(66572.0625, grad_fn=<MseLossBackward>)
output :  tensor([[144925.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5578.2227, grad_fn=<MseLossBackward>)
output :  tensor([[152622.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4720e+08, grad_fn=<MseLossBackward>)
output :  tensor([[104019.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(16154810., grad_fn=<MseLossBackward>)
output :  tensor([[72526.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5692e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164125.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(764039.8750, grad_fn=<MseLossBackward>)
output :  tensor([[190056.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4397e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161317.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(11005495., grad_fn=<MseLossBackward>)
output :  tensor([[153128.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(19106188., grad_fn=<MseLossBackward>)
output :  tensor([[138644.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1425971.8750, grad_fn=<MseLossBackward>)
output :  tensor([[204166.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3181374., grad_fn=<MseLossBackward>)
output :  tensor([[139730.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2993440.7500, grad_fn=<MseLossBackward>)
output :  tensor([[182590.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6233e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149168.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(10040779., grad_fn=<MseLossBackward>)
output :  tensor([[108792.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6527e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93639.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(130315.3594, grad_fn=<MseLossBackward>)
output :  tensor([[173769.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1514745.5000, grad_fn=<MseLossBackward>)
output :  tensor([[256720.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(13541710., grad_fn=<MseLossBackward>)
output :  tensor([[143056.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2422449., grad_fn=<MseLossBackward>)
output :  tensor([[160413.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(269247.4688, grad_fn=<MseLossBackward>)
output :  tensor([[131699.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(640550.1250, grad_fn=<MseLossBackward>)
output :  tensor([[151394.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3590255.2500, grad_fn=<MseLossBackward>)
output :  tensor([[169310.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1989422.1250, grad_fn=<MseLossBackward>)
output :  tensor([[128805.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(3259350.7500, grad_fn=<MseLossBackward>)
output :  tensor([[170387.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4452e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158418.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2011566., grad_fn=<MseLossBackward>)
output :  tensor([[118383.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3547690., grad_fn=<MseLossBackward>)
output :  tensor([[160208.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2987e+09, grad_fn=<MseLossBackward>)
output :  tensor([[56094.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(16766850., grad_fn=<MseLossBackward>)
output :  tensor([[232210.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4464e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201777.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(604263.3125, grad_fn=<MseLossBackward>)
output :  tensor([[184591.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(166987.1562, grad_fn=<MseLossBackward>)
output :  tensor([[106069.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(4768.5498, grad_fn=<MseLossBackward>)
output :  tensor([[86548.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(203556.0625, grad_fn=<MseLossBackward>)
output :  tensor([[138101.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3603946.2500, grad_fn=<MseLossBackward>)
output :  tensor([[223169.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0170e+09, grad_fn=<MseLossBackward>)
output :  tensor([[206477.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1046497.0625, grad_fn=<MseLossBackward>)
output :  tensor([[169060.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(16487787., grad_fn=<MseLossBackward>)
output :  tensor([[175055.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0900e+09, grad_fn=<MseLossBackward>)
output :  tensor([[188796.]], grad_fn=<AddmmBackward>)
loss:  tensor(1449616., grad_fn=<MseLossBackward>)
output :  tensor([[88202.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(1445987.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137836.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4679515.5000, grad_fn=<MseLossBackward>)
output :  tensor([[111103.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(364136.8125, grad_fn=<MseLossBackward>)
output :  tensor([[146295.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0682e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172832.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7500e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194825.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0351e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179235.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(584340.8125, grad_fn=<MseLossBackward>)
output :  tensor([[98457.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(3833672.2500, grad_fn=<MseLossBackward>)
output :  tensor([[118245.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(556434.4375, grad_fn=<MseLossBackward>)
output :  tensor([[161412.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1018e+08, grad_fn=<MseLossBackward>)
output :  tensor([[205499.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(30239516., grad_fn=<MseLossBackward>)
output :  tensor([[144213.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(45755.8828, grad_fn=<MseLossBackward>)
train_loss: [2.5734474e+09]
epoch_result tensor([0.])
output :  tensor([[157985.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(264437., grad_fn=<MseLossBackward>)
output :  tensor([[121846.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(23430.5215, grad_fn=<MseLossBackward>)
output :  tensor([[196620.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5855870.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176496.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(253764.0625, grad_fn=<MseLossBackward>)
output :  tensor([[151211.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1763e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124806.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(10196247., grad_fn=<MseLossBackward>)
output :  tensor([[139352.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2713844.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117923.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1159020.5000, grad_fn=<MseLossBackward>)
output :  tensor([[64570.9023]], grad_fn=<AddmmBackward>)
loss:  tensor(36855856., grad_fn=<MseLossBackward>)
output :  tensor([[166840.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(706597.8750, grad_fn=<MseLossBackward>)
output :  tensor([[131089.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(79391440., grad_fn=<MseLossBackward>)
output :  tensor([[223526.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2169867., grad_fn=<MseLossBackward>)
output :  tensor([[164531.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(19965538., grad_fn=<MseLossBackward>)
output :  tensor([[250164.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(216065.1875, grad_fn=<MseLossBackward>)
output :  tensor([[58742.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(14007300., grad_fn=<MseLossBackward>)
output :  tensor([[158487.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9565e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183529.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(72757168., grad_fn=<MseLossBackward>)
output :  tensor([[151066.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(29519018., grad_fn=<MseLossBackward>)
output :  tensor([[270686.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(18603586., grad_fn=<MseLossBackward>)
output :  tensor([[194762.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5007105.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139475.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4542e+10, grad_fn=<MseLossBackward>)
output :  tensor([[192934.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(892906.8750, grad_fn=<MseLossBackward>)
output :  tensor([[179958.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0197e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150256.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(552676.0625, grad_fn=<MseLossBackward>)
output :  tensor([[169585.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(171875.0156, grad_fn=<MseLossBackward>)
output :  tensor([[85074.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(106097.7969, grad_fn=<MseLossBackward>)
output :  tensor([[171116.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3775e+09, grad_fn=<MseLossBackward>)
output :  tensor([[187212.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4895571., grad_fn=<MseLossBackward>)
output :  tensor([[210103.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0609e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109415.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(341485., grad_fn=<MseLossBackward>)
output :  tensor([[172537.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2364002.2500, grad_fn=<MseLossBackward>)
output :  tensor([[137270.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(594368.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128112.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(788113.9375, grad_fn=<MseLossBackward>)
output :  tensor([[121882.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(5676641.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146048.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4384e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166406.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2080e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147894.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3261128., grad_fn=<MseLossBackward>)
output :  tensor([[180421.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(177477.8906, grad_fn=<MseLossBackward>)
output :  tensor([[142957.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3832968.5000, grad_fn=<MseLossBackward>)
output :  tensor([[107667.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1213e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135703.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2880e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130861.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(17126082., grad_fn=<MseLossBackward>)
output :  tensor([[137439.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0898e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223478.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2314344.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134544.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5262866., grad_fn=<MseLossBackward>)
output :  tensor([[152284.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(10789891., grad_fn=<MseLossBackward>)
output :  tensor([[111782.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(47442.2852, grad_fn=<MseLossBackward>)
output :  tensor([[163009.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(9055021., grad_fn=<MseLossBackward>)
output :  tensor([[148487.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1634e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190091.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3643028.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134691.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(58216.6406, grad_fn=<MseLossBackward>)
output :  tensor([[110454.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(206137.2812, grad_fn=<MseLossBackward>)
output :  tensor([[231794.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4863058.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169508.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9343e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159987.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(975557.4375, grad_fn=<MseLossBackward>)
output :  tensor([[202728.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8822e+10, grad_fn=<MseLossBackward>)
output :  tensor([[247973.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1242e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143884.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(147996.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135094.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1198203.8750, grad_fn=<MseLossBackward>)
output :  tensor([[155559.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(312813., grad_fn=<MseLossBackward>)
output :  tensor([[133507.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(12302118., grad_fn=<MseLossBackward>)
output :  tensor([[179611.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4623e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183007.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1192771.1250, grad_fn=<MseLossBackward>)
output :  tensor([[161694.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(37903.2227, grad_fn=<MseLossBackward>)
output :  tensor([[135199.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(60843900., grad_fn=<MseLossBackward>)
output :  tensor([[143221.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(520855.4062, grad_fn=<MseLossBackward>)
output :  tensor([[150170.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(26733908., grad_fn=<MseLossBackward>)
output :  tensor([[174278.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2781e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193797.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3835e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138063.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2444385.7500, grad_fn=<MseLossBackward>)
output :  tensor([[176314.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(19487396., grad_fn=<MseLossBackward>)
output :  tensor([[176917.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(16670379., grad_fn=<MseLossBackward>)
output :  tensor([[116601.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2564251.7500, grad_fn=<MseLossBackward>)
output :  tensor([[215491.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(30343228., grad_fn=<MseLossBackward>)
output :  tensor([[181220.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5195408., grad_fn=<MseLossBackward>)
output :  tensor([[127952.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(6012955.5000, grad_fn=<MseLossBackward>)
output :  tensor([[197338.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(703711.2500, grad_fn=<MseLossBackward>)
output :  tensor([[176637.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3020535.5000, grad_fn=<MseLossBackward>)
output :  tensor([[211127.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0668e+10, grad_fn=<MseLossBackward>)
output :  tensor([[210858.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(19986.8906, grad_fn=<MseLossBackward>)
output :  tensor([[164926.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1510e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196218.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2953940.5000, grad_fn=<MseLossBackward>)
output :  tensor([[116547.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(12585532., grad_fn=<MseLossBackward>)
output :  tensor([[115613.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(9695682., grad_fn=<MseLossBackward>)
output :  tensor([[111108.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(795023., grad_fn=<MseLossBackward>)
output :  tensor([[148449.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2720953.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158771.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3809e+10, grad_fn=<MseLossBackward>)
output :  tensor([[182880.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8295750., grad_fn=<MseLossBackward>)
output :  tensor([[129356.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3448275., grad_fn=<MseLossBackward>)
output :  tensor([[145482.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(232911.8125, grad_fn=<MseLossBackward>)
output :  tensor([[184457.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4559e+09, grad_fn=<MseLossBackward>)
output :  tensor([[121544.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(21572178., grad_fn=<MseLossBackward>)
output :  tensor([[195888.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1235015.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145236.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(56035.7656, grad_fn=<MseLossBackward>)
output :  tensor([[216347.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(11886765., grad_fn=<MseLossBackward>)
output :  tensor([[126572.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(327291.2500, grad_fn=<MseLossBackward>)
output :  tensor([[246146.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4756965.5000, grad_fn=<MseLossBackward>)
output :  tensor([[239360.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0830e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144400.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6902e+08, grad_fn=<MseLossBackward>)
output :  tensor([[84181.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3739e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197915.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9266e+09, grad_fn=<MseLossBackward>)
output :  tensor([[77187.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(14537241., grad_fn=<MseLossBackward>)
output :  tensor([[139907.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(166234.5781, grad_fn=<MseLossBackward>)
output :  tensor([[77157.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2748497.7500, grad_fn=<MseLossBackward>)
output :  tensor([[144718.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3117100.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174681.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1738236.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155478.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3912978.5000, grad_fn=<MseLossBackward>)
output :  tensor([[108524.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(1264447.5000, grad_fn=<MseLossBackward>)
output :  tensor([[205342.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2190e+10, grad_fn=<MseLossBackward>)
output :  tensor([[126454.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(4186020., grad_fn=<MseLossBackward>)
output :  tensor([[271121.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(78829424., grad_fn=<MseLossBackward>)
output :  tensor([[298985.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2132e+08, grad_fn=<MseLossBackward>)
output :  tensor([[109771.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(5161948.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170610.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3571568.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133230.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3657e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134132.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(23689970., grad_fn=<MseLossBackward>)
output :  tensor([[131831.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2500697.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122713.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(5226617.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133901.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9544e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226517.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8606e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189535.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2942e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144820.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(847550.3750, grad_fn=<MseLossBackward>)
output :  tensor([[125666.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(3362324., grad_fn=<MseLossBackward>)
output :  tensor([[109160.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(4367022.5000, grad_fn=<MseLossBackward>)
output :  tensor([[258967.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4920e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138532.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(12478998., grad_fn=<MseLossBackward>)
output :  tensor([[206431.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(11774871., grad_fn=<MseLossBackward>)
output :  tensor([[107584.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(7206204.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138763.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1408931.8750, grad_fn=<MseLossBackward>)
output :  tensor([[209846.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1474e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180524.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(389824.6250, grad_fn=<MseLossBackward>)
output :  tensor([[186095.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1199709.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163065.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1297e+10, grad_fn=<MseLossBackward>)
output :  tensor([[303076.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0191e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196245.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2736905., grad_fn=<MseLossBackward>)
output :  tensor([[259318.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0604e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222203.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9181e+09, grad_fn=<MseLossBackward>)
output :  tensor([[284787.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0376e+09, grad_fn=<MseLossBackward>)
output :  tensor([[221167.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8023676., grad_fn=<MseLossBackward>)
output :  tensor([[222051.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8883e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196776.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(49847.5391, grad_fn=<MseLossBackward>)
output :  tensor([[158082.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4579e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130946.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(2412512.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135642.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(20368.6406, grad_fn=<MseLossBackward>)
output :  tensor([[90530.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(220657.7188, grad_fn=<MseLossBackward>)
output :  tensor([[107472.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(278157.3438, grad_fn=<MseLossBackward>)
output :  tensor([[272990.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1259e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236361.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1854788.6250, grad_fn=<MseLossBackward>)
output :  tensor([[146921.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3693183., grad_fn=<MseLossBackward>)
output :  tensor([[138855.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1838566.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172781.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(906066., grad_fn=<MseLossBackward>)
output :  tensor([[147585.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5455290., grad_fn=<MseLossBackward>)
output :  tensor([[164946.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7343e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164961.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1476.2405, grad_fn=<MseLossBackward>)
output :  tensor([[140852.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(14838506., grad_fn=<MseLossBackward>)
output :  tensor([[189391.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4744e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111590.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(167498.3594, grad_fn=<MseLossBackward>)
output :  tensor([[171812.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(35308.7578, grad_fn=<MseLossBackward>)
output :  tensor([[122781.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(7738872., grad_fn=<MseLossBackward>)
output :  tensor([[89454.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(6026066., grad_fn=<MseLossBackward>)
output :  tensor([[178051.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3797017.5000, grad_fn=<MseLossBackward>)
output :  tensor([[111420.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2311065., grad_fn=<MseLossBackward>)
output :  tensor([[238620.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(143925.3906, grad_fn=<MseLossBackward>)
output :  tensor([[245441.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(195087.8438, grad_fn=<MseLossBackward>)
output :  tensor([[135566.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(36803372., grad_fn=<MseLossBackward>)
output :  tensor([[112439.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(12110835., grad_fn=<MseLossBackward>)
output :  tensor([[287419.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2420e+10, grad_fn=<MseLossBackward>)
output :  tensor([[172690.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1417327.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128304.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(10922767., grad_fn=<MseLossBackward>)
output :  tensor([[143374.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4386e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202561.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3083e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141323.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(104895.0156, grad_fn=<MseLossBackward>)
output :  tensor([[154987.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5628e+10, grad_fn=<MseLossBackward>)
output :  tensor([[156759.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(8178617., grad_fn=<MseLossBackward>)
output :  tensor([[131937.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5942320.5000, grad_fn=<MseLossBackward>)
output :  tensor([[248845.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6810e+10, grad_fn=<MseLossBackward>)
output :  tensor([[403018.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1037024., grad_fn=<MseLossBackward>)
output :  tensor([[110962.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(3849597.2500, grad_fn=<MseLossBackward>)
output :  tensor([[112312.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(38282064., grad_fn=<MseLossBackward>)
output :  tensor([[159485.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(210.2500, grad_fn=<MseLossBackward>)
output :  tensor([[130456.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5428e+08, grad_fn=<MseLossBackward>)
output :  tensor([[161989.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6013e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172091.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8554e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103979.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(143901.6875, grad_fn=<MseLossBackward>)
output :  tensor([[138573.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5886386., grad_fn=<MseLossBackward>)
output :  tensor([[363895.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(11547891., grad_fn=<MseLossBackward>)
output :  tensor([[207164.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1936e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175423.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5825.9824, grad_fn=<MseLossBackward>)
output :  tensor([[206488.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(12878678., grad_fn=<MseLossBackward>)
output :  tensor([[139833.]], grad_fn=<AddmmBackward>)
loss:  tensor(693889., grad_fn=<MseLossBackward>)
output :  tensor([[193017.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2197806.2500, grad_fn=<MseLossBackward>)
output :  tensor([[133847.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9419e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179987.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1025346.1250, grad_fn=<MseLossBackward>)
output :  tensor([[238911.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9541342., grad_fn=<MseLossBackward>)
output :  tensor([[171505.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6224245.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109432.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(2052526.3750, grad_fn=<MseLossBackward>)
output :  tensor([[261655.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(8442657., grad_fn=<MseLossBackward>)
output :  tensor([[248575.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2028310., grad_fn=<MseLossBackward>)
output :  tensor([[120975.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4100055.5000, grad_fn=<MseLossBackward>)
output :  tensor([[217099.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3524e+09, grad_fn=<MseLossBackward>)
output :  tensor([[306475.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5436e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207727.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(528778.9375, grad_fn=<MseLossBackward>)
output :  tensor([[216194.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5328e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157858.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1715.7717, grad_fn=<MseLossBackward>)
output :  tensor([[170346.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(126836.1484, grad_fn=<MseLossBackward>)
output :  tensor([[158011.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1165219., grad_fn=<MseLossBackward>)
output :  tensor([[171211.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1467808., grad_fn=<MseLossBackward>)
output :  tensor([[238484.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7118e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224554.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(24021792., grad_fn=<MseLossBackward>)
output :  tensor([[159298.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5125e+08, grad_fn=<MseLossBackward>)
output :  tensor([[121466.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2352197.2500, grad_fn=<MseLossBackward>)
output :  tensor([[176636.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(131859.7656, grad_fn=<MseLossBackward>)
output :  tensor([[177865.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7461e+09, grad_fn=<MseLossBackward>)
output :  tensor([[207936.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4850e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134867.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(189524.1875, grad_fn=<MseLossBackward>)
output :  tensor([[148586.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2828e+08, grad_fn=<MseLossBackward>)
output :  tensor([[276201.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(637752., grad_fn=<MseLossBackward>)
output :  tensor([[84316.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(466915.9688, grad_fn=<MseLossBackward>)
output :  tensor([[237425.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(857418.1250, grad_fn=<MseLossBackward>)
output :  tensor([[260466.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0398e+11, grad_fn=<MseLossBackward>)
output :  tensor([[173766.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(14189230., grad_fn=<MseLossBackward>)
output :  tensor([[195667.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5471e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156109.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1230435.5000, grad_fn=<MseLossBackward>)
output :  tensor([[208593.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7707e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127574.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2032896.7500, grad_fn=<MseLossBackward>)
output :  tensor([[148789.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(14361139., grad_fn=<MseLossBackward>)
output :  tensor([[171748.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5549e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185031.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(669712.0625, grad_fn=<MseLossBackward>)
output :  tensor([[133190.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(51699244., grad_fn=<MseLossBackward>)
output :  tensor([[138607.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4441885.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174461.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2136119.2500, grad_fn=<MseLossBackward>)
output :  tensor([[199076.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5933e+09, grad_fn=<MseLossBackward>)
output :  tensor([[240533.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6082774.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151542.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(11955495., grad_fn=<MseLossBackward>)
output :  tensor([[196813.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(661273.9375, grad_fn=<MseLossBackward>)
output :  tensor([[161829.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1788e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180306.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(650896., grad_fn=<MseLossBackward>)
output :  tensor([[179731.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(28397.5156, grad_fn=<MseLossBackward>)
output :  tensor([[95059.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(3766480.2500, grad_fn=<MseLossBackward>)
output :  tensor([[171693.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1730e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133119.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3535751.5000, grad_fn=<MseLossBackward>)
output :  tensor([[119656.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(21683210., grad_fn=<MseLossBackward>)
output :  tensor([[168690.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(28193114., grad_fn=<MseLossBackward>)
output :  tensor([[85209.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(43942.6406, grad_fn=<MseLossBackward>)
output :  tensor([[283079.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(47893320., grad_fn=<MseLossBackward>)
output :  tensor([[166769.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3130356.2500, grad_fn=<MseLossBackward>)
output :  tensor([[193558.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9491e+10, grad_fn=<MseLossBackward>)
output :  tensor([[247130.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6975e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154965.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(15727917., grad_fn=<MseLossBackward>)
output :  tensor([[122957.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(1087213.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120342.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(196179.7812, grad_fn=<MseLossBackward>)
output :  tensor([[145123.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0741e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176824.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7977800., grad_fn=<MseLossBackward>)
output :  tensor([[110734.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9719e+08, grad_fn=<MseLossBackward>)
output :  tensor([[211817.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1275e+10, grad_fn=<MseLossBackward>)
output :  tensor([[240594.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(819307.8125, grad_fn=<MseLossBackward>)
output :  tensor([[253577.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0055e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221218.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1617e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197516.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3920e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190140.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6970012.5000, grad_fn=<MseLossBackward>)
output :  tensor([[207728.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7150e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191038.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1014e+10, grad_fn=<MseLossBackward>)
output :  tensor([[176660.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4325360., grad_fn=<MseLossBackward>)
output :  tensor([[152805.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(648830.2500, grad_fn=<MseLossBackward>)
output :  tensor([[331977.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(25228332., grad_fn=<MseLossBackward>)
output :  tensor([[210621.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1900865.3750, grad_fn=<MseLossBackward>)
output :  tensor([[160278.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(77623.1875, grad_fn=<MseLossBackward>)
output :  tensor([[189782.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6747e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103730.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1611947.6250, grad_fn=<MseLossBackward>)
output :  tensor([[277611.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6944e+10, grad_fn=<MseLossBackward>)
output :  tensor([[172488.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1993611.6250, grad_fn=<MseLossBackward>)
output :  tensor([[218370.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(23721010., grad_fn=<MseLossBackward>)
output :  tensor([[213723.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(52952456., grad_fn=<MseLossBackward>)
output :  tensor([[178019.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1392658.1250, grad_fn=<MseLossBackward>)
output :  tensor([[197560.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(17970180., grad_fn=<MseLossBackward>)
output :  tensor([[151516.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(12135970., grad_fn=<MseLossBackward>)
output :  tensor([[147674.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2729e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119306.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(650832.9375, grad_fn=<MseLossBackward>)
output :  tensor([[141039.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1080235.3750, grad_fn=<MseLossBackward>)
output :  tensor([[151082.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4335765., grad_fn=<MseLossBackward>)
output :  tensor([[202592.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5727e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161327.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3341184.2500, grad_fn=<MseLossBackward>)
output :  tensor([[100421.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(849075.8750, grad_fn=<MseLossBackward>)
output :  tensor([[227197.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6390e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184932.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7764e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176188.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(87717.7812, grad_fn=<MseLossBackward>)
output :  tensor([[88141.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(37715624., grad_fn=<MseLossBackward>)
output :  tensor([[129990.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2221683.5000, grad_fn=<MseLossBackward>)
output :  tensor([[217680.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(13544930., grad_fn=<MseLossBackward>)
output :  tensor([[143728.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(73873.5391, grad_fn=<MseLossBackward>)
output :  tensor([[130912.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(833198.1250, grad_fn=<MseLossBackward>)
output :  tensor([[145647.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(9288685., grad_fn=<MseLossBackward>)
output :  tensor([[176583.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5275e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144283.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(80195.1562, grad_fn=<MseLossBackward>)
output :  tensor([[159829.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(29032.9648, grad_fn=<MseLossBackward>)
output :  tensor([[215638.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(407103.8125, grad_fn=<MseLossBackward>)
output :  tensor([[135425.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2573e+08, grad_fn=<MseLossBackward>)
output :  tensor([[259700.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(22093672., grad_fn=<MseLossBackward>)
output :  tensor([[158869.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(398062.4062, grad_fn=<MseLossBackward>)
output :  tensor([[129679.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(1390243.6250, grad_fn=<MseLossBackward>)
output :  tensor([[95643.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(413680.1250, grad_fn=<MseLossBackward>)
output :  tensor([[151765.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5246e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175908.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(15931199., grad_fn=<MseLossBackward>)
output :  tensor([[119795.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(496474.3750, grad_fn=<MseLossBackward>)
output :  tensor([[191376.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4117e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145272.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3260e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149487.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(170259.3906, grad_fn=<MseLossBackward>)
output :  tensor([[187580.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(28820.3672, grad_fn=<MseLossBackward>)
output :  tensor([[250169.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8411e+09, grad_fn=<MseLossBackward>)
output :  tensor([[89461.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(4157361.7500, grad_fn=<MseLossBackward>)
output :  tensor([[240277.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(77240.5703, grad_fn=<MseLossBackward>)
output :  tensor([[128273.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(51227.9570, grad_fn=<MseLossBackward>)
output :  tensor([[167590.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6647e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113764.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8945e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177717.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2951040.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164148.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1249e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152607.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8876e+08, grad_fn=<MseLossBackward>)
output :  tensor([[240265.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1602162.6250, grad_fn=<MseLossBackward>)
output :  tensor([[224007.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1555e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127962.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(926692., grad_fn=<MseLossBackward>)
output :  tensor([[128905.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8440387., grad_fn=<MseLossBackward>)
output :  tensor([[225176.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3324468.5000, grad_fn=<MseLossBackward>)
output :  tensor([[227206.]], grad_fn=<AddmmBackward>)
loss:  tensor(46158436., grad_fn=<MseLossBackward>)
output :  tensor([[228213.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2290540.2500, grad_fn=<MseLossBackward>)
output :  tensor([[146206.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3218155.7500, grad_fn=<MseLossBackward>)
output :  tensor([[211883.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3545806.7500, grad_fn=<MseLossBackward>)
output :  tensor([[132748.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6251e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130408.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4375679.5000, grad_fn=<MseLossBackward>)
output :  tensor([[308091.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(47732552., grad_fn=<MseLossBackward>)
output :  tensor([[143249.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5059899., grad_fn=<MseLossBackward>)
output :  tensor([[121744.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9969e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109520.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(429.2666, grad_fn=<MseLossBackward>)
output :  tensor([[158077.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0800e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182020.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5942e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175403.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5778014., grad_fn=<MseLossBackward>)
output :  tensor([[192397.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(74008648., grad_fn=<MseLossBackward>)
output :  tensor([[95728.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(18245846., grad_fn=<MseLossBackward>)
output :  tensor([[178299.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(490831.5938, grad_fn=<MseLossBackward>)
output :  tensor([[168483.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(340271.6875, grad_fn=<MseLossBackward>)
output :  tensor([[136392.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6799708., grad_fn=<MseLossBackward>)
output :  tensor([[259989.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8229e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142366.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2909e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175181.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4760510.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142699.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7289072., grad_fn=<MseLossBackward>)
output :  tensor([[199137.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1855810.2500, grad_fn=<MseLossBackward>)
output :  tensor([[167481.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6343629.5000, grad_fn=<MseLossBackward>)
output :  tensor([[243500.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(249625.1406, grad_fn=<MseLossBackward>)
output :  tensor([[133288.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1467126.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150112.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(581072.6875, grad_fn=<MseLossBackward>)
output :  tensor([[212641.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5564144., grad_fn=<MseLossBackward>)
output :  tensor([[161250.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(14055352., grad_fn=<MseLossBackward>)
output :  tensor([[195333.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(40111044., grad_fn=<MseLossBackward>)
output :  tensor([[131489.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5680e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129565.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(319843.2812, grad_fn=<MseLossBackward>)
output :  tensor([[142806.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7878898., grad_fn=<MseLossBackward>)
output :  tensor([[203231.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3915e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166800.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6833e+09, grad_fn=<MseLossBackward>)
output :  tensor([[72381.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5330e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92212.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(59489644., grad_fn=<MseLossBackward>)
output :  tensor([[251117.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4734024., grad_fn=<MseLossBackward>)
output :  tensor([[204885.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3409e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115442.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(196193.6250, grad_fn=<MseLossBackward>)
output :  tensor([[159059.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0886e+08, grad_fn=<MseLossBackward>)
output :  tensor([[212359.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(58382492., grad_fn=<MseLossBackward>)
output :  tensor([[181905.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7606e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158684.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(13576116., grad_fn=<MseLossBackward>)
output :  tensor([[167631.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5608312., grad_fn=<MseLossBackward>)
output :  tensor([[114494.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(255806.7656, grad_fn=<MseLossBackward>)
output :  tensor([[158950.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(15603241., grad_fn=<MseLossBackward>)
output :  tensor([[192560.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0562e+08, grad_fn=<MseLossBackward>)
output :  tensor([[217420.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4325880., grad_fn=<MseLossBackward>)
output :  tensor([[248225.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4678e+11, grad_fn=<MseLossBackward>)
output :  tensor([[148874.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3515449.2500, grad_fn=<MseLossBackward>)
output :  tensor([[107857.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(387486.8125, grad_fn=<MseLossBackward>)
output :  tensor([[170797.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2326e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150917.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(174175.8125, grad_fn=<MseLossBackward>)
output :  tensor([[230942.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(36690656., grad_fn=<MseLossBackward>)
output :  tensor([[114400.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(358875.8750, grad_fn=<MseLossBackward>)
output :  tensor([[179679.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(10369205., grad_fn=<MseLossBackward>)
output :  tensor([[189288.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6702274., grad_fn=<MseLossBackward>)
output :  tensor([[166481.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3568e+10, grad_fn=<MseLossBackward>)
output :  tensor([[93561.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5779e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235626.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(11377340., grad_fn=<MseLossBackward>)
output :  tensor([[178740.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7512652.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142917.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8510439., grad_fn=<MseLossBackward>)
output :  tensor([[234918.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6591.4102, grad_fn=<MseLossBackward>)
output :  tensor([[165838.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(8058856.5000, grad_fn=<MseLossBackward>)
output :  tensor([[205762.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4218e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136284.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1649980.3750, grad_fn=<MseLossBackward>)
output :  tensor([[188909.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2413e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136803.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(645386.3125, grad_fn=<MseLossBackward>)
output :  tensor([[228070.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(62882916., grad_fn=<MseLossBackward>)
output :  tensor([[229638.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1458e+08, grad_fn=<MseLossBackward>)
output :  tensor([[90296.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(87648.3750, grad_fn=<MseLossBackward>)
output :  tensor([[159529.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(9180.0352, grad_fn=<MseLossBackward>)
output :  tensor([[249754.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4671e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147946.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(8683796., grad_fn=<MseLossBackward>)
output :  tensor([[109736.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8264e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165142.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(413127.5625, grad_fn=<MseLossBackward>)
output :  tensor([[149429.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(29476756., grad_fn=<MseLossBackward>)
output :  tensor([[129194.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(988113.6875, grad_fn=<MseLossBackward>)
output :  tensor([[189319.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8553e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123673.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(1376497.2500, grad_fn=<MseLossBackward>)
output :  tensor([[150706.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1672697.6250, grad_fn=<MseLossBackward>)
output :  tensor([[168471.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(10751329., grad_fn=<MseLossBackward>)
output :  tensor([[151215.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(46581.7812, grad_fn=<MseLossBackward>)
output :  tensor([[161423.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2180929., grad_fn=<MseLossBackward>)
output :  tensor([[134910.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7136e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134133.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4552355.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154739.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4774e+08, grad_fn=<MseLossBackward>)
output :  tensor([[143963.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(35496.9141, grad_fn=<MseLossBackward>)
output :  tensor([[161290.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(211197.6875, grad_fn=<MseLossBackward>)
output :  tensor([[135828.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7230e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151023.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4944369., grad_fn=<MseLossBackward>)
output :  tensor([[187126.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(763466.3750, grad_fn=<MseLossBackward>)
output :  tensor([[170057.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1119198.7500, grad_fn=<MseLossBackward>)
output :  tensor([[178700.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1688578.3750, grad_fn=<MseLossBackward>)
output :  tensor([[217040.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(8759935., grad_fn=<MseLossBackward>)
output :  tensor([[112905.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(25054560., grad_fn=<MseLossBackward>)
output :  tensor([[134581.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(93729328., grad_fn=<MseLossBackward>)
output :  tensor([[285880.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(14213.1104, grad_fn=<MseLossBackward>)
output :  tensor([[117222.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(1493723.2500, grad_fn=<MseLossBackward>)
output :  tensor([[177230.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8292e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186883.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3548396.2500, grad_fn=<MseLossBackward>)
output :  tensor([[186102.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(363269.9062, grad_fn=<MseLossBackward>)
output :  tensor([[250546.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9800e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221945.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2968.5471, grad_fn=<MseLossBackward>)
output :  tensor([[122588.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7850e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173870.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3560e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125649.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2721211., grad_fn=<MseLossBackward>)
output :  tensor([[183550.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5142e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157449.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(19800692., grad_fn=<MseLossBackward>)
output :  tensor([[154228.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(59724884., grad_fn=<MseLossBackward>)
output :  tensor([[208483.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4768559.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145000.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5625e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175037.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(927038., grad_fn=<MseLossBackward>)
output :  tensor([[253706.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6532e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148702.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(492979.5000, grad_fn=<MseLossBackward>)
output :  tensor([[203059.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(156012.6562, grad_fn=<MseLossBackward>)
output :  tensor([[163217.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(10677067., grad_fn=<MseLossBackward>)
output :  tensor([[120534.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0585e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135924.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(30373.9531, grad_fn=<MseLossBackward>)
output :  tensor([[184783.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(613798.8125, grad_fn=<MseLossBackward>)
output :  tensor([[196383.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(40751468., grad_fn=<MseLossBackward>)
output :  tensor([[232591.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1819e+09, grad_fn=<MseLossBackward>)
output :  tensor([[251714.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(27941630., grad_fn=<MseLossBackward>)
output :  tensor([[190633.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6478e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143128.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6655e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145351.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(725850.7500, grad_fn=<MseLossBackward>)
output :  tensor([[72492.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0557e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130763.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(17943960., grad_fn=<MseLossBackward>)
output :  tensor([[126291.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(6802479., grad_fn=<MseLossBackward>)
output :  tensor([[156005.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4023158.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128213.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1471634.3750, grad_fn=<MseLossBackward>)
output :  tensor([[77964.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2143890.7500, grad_fn=<MseLossBackward>)
output :  tensor([[83806.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3263668., grad_fn=<MseLossBackward>)
output :  tensor([[238970.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(48587000., grad_fn=<MseLossBackward>)
output :  tensor([[139227.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1438e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130431.]], grad_fn=<AddmmBackward>)
loss:  tensor(4761., grad_fn=<MseLossBackward>)
output :  tensor([[169342.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5486647.5000, grad_fn=<MseLossBackward>)
output :  tensor([[234798.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(40476.4102, grad_fn=<MseLossBackward>)
output :  tensor([[184953.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(51650724., grad_fn=<MseLossBackward>)
output :  tensor([[155466.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(284922.4375, grad_fn=<MseLossBackward>)
output :  tensor([[196451.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2098876.5000, grad_fn=<MseLossBackward>)
output :  tensor([[204425.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0611e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137879.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(773382.8125, grad_fn=<MseLossBackward>)
output :  tensor([[152717.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5207595.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133468.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6407622., grad_fn=<MseLossBackward>)
output :  tensor([[202104.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7818e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153237.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(581430.0625, grad_fn=<MseLossBackward>)
output :  tensor([[136555.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8538e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144317.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(339816.1250, grad_fn=<MseLossBackward>)
output :  tensor([[208600.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(11556282., grad_fn=<MseLossBackward>)
output :  tensor([[99621.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1052e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163966.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(12486947., grad_fn=<MseLossBackward>)
output :  tensor([[126755.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1548624.7500, grad_fn=<MseLossBackward>)
output :  tensor([[148058.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1120720., grad_fn=<MseLossBackward>)
output :  tensor([[104666.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7879e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138124.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(389649.0625, grad_fn=<MseLossBackward>)
output :  tensor([[232726.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(10716211., grad_fn=<MseLossBackward>)
output :  tensor([[145268.]], grad_fn=<AddmmBackward>)
loss:  tensor(71824., grad_fn=<MseLossBackward>)
output :  tensor([[137605.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(11179.7578, grad_fn=<MseLossBackward>)
output :  tensor([[164875.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3598e+09, grad_fn=<MseLossBackward>)
output :  tensor([[273892.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(16873354., grad_fn=<MseLossBackward>)
output :  tensor([[176727.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2985390., grad_fn=<MseLossBackward>)
output :  tensor([[103321.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(297936.8750, grad_fn=<MseLossBackward>)
output :  tensor([[202172.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6742e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156358.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6978017.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162951.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5999e+10, grad_fn=<MseLossBackward>)
output :  tensor([[98914.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(377466.2500, grad_fn=<MseLossBackward>)
output :  tensor([[125065.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(2148629.2500, grad_fn=<MseLossBackward>)
output :  tensor([[154150.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3419263.2500, grad_fn=<MseLossBackward>)
output :  tensor([[141437.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2067574.3750, grad_fn=<MseLossBackward>)
output :  tensor([[200559.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(313337.5625, grad_fn=<MseLossBackward>)
output :  tensor([[136465.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(30626366., grad_fn=<MseLossBackward>)
output :  tensor([[261573.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(499694.3438, grad_fn=<MseLossBackward>)
output :  tensor([[126376.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1140e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163941.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2429312., grad_fn=<MseLossBackward>)
output :  tensor([[188381.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(14023.7402, grad_fn=<MseLossBackward>)
output :  tensor([[122669.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6052e+08, grad_fn=<MseLossBackward>)
output :  tensor([[246214.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(14332850., grad_fn=<MseLossBackward>)
output :  tensor([[158978.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8520e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243792.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2425806.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143282.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(515052.9062, grad_fn=<MseLossBackward>)
output :  tensor([[208623.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1893419., grad_fn=<MseLossBackward>)
output :  tensor([[175323.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8545299., grad_fn=<MseLossBackward>)
output :  tensor([[153274.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(526645., grad_fn=<MseLossBackward>)
output :  tensor([[118256.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(65672.0703, grad_fn=<MseLossBackward>)
output :  tensor([[239706.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2452e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236773.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(10411008., grad_fn=<MseLossBackward>)
output :  tensor([[151184.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4634130.5000, grad_fn=<MseLossBackward>)
output :  tensor([[255291.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(153284.4844, grad_fn=<MseLossBackward>)
output :  tensor([[126059.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3353e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177211.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1468603.1250, grad_fn=<MseLossBackward>)
output :  tensor([[161112.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1237969.1250, grad_fn=<MseLossBackward>)
output :  tensor([[134944.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(15560559., grad_fn=<MseLossBackward>)
output :  tensor([[193403.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0837e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163801.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(39315.4531, grad_fn=<MseLossBackward>)
output :  tensor([[165894.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(8378763.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157728.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(73890.5312, grad_fn=<MseLossBackward>)
output :  tensor([[152258.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5561711.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171062.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7900e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160554.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(307504.9062, grad_fn=<MseLossBackward>)
output :  tensor([[376777.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(51726212., grad_fn=<MseLossBackward>)
output :  tensor([[134721.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(59626388., grad_fn=<MseLossBackward>)
output :  tensor([[131520.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1179e+09, grad_fn=<MseLossBackward>)
output :  tensor([[277287.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(15412985., grad_fn=<MseLossBackward>)
output :  tensor([[162042.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1812.8967, grad_fn=<MseLossBackward>)
output :  tensor([[128705.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(67330232., grad_fn=<MseLossBackward>)
output :  tensor([[240262.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(68264520., grad_fn=<MseLossBackward>)
output :  tensor([[177782.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(7385485.5000, grad_fn=<MseLossBackward>)
output :  tensor([[156081.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(16656474., grad_fn=<MseLossBackward>)
output :  tensor([[147204.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4859131.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152223.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3482e+08, grad_fn=<MseLossBackward>)
output :  tensor([[100709.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(503556.5625, grad_fn=<MseLossBackward>)
output :  tensor([[70239.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0485e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166193.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1423808.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188575.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5543e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161580.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(12818861., grad_fn=<MseLossBackward>)
output :  tensor([[161419.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(15366033., grad_fn=<MseLossBackward>)
output :  tensor([[137763.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(97998.3438, grad_fn=<MseLossBackward>)
output :  tensor([[209745.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(14404990., grad_fn=<MseLossBackward>)
output :  tensor([[141381.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(11436444., grad_fn=<MseLossBackward>)
output :  tensor([[184546.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5738e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144981.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1037501.3750, grad_fn=<MseLossBackward>)
output :  tensor([[106826.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6772e+08, grad_fn=<MseLossBackward>)
output :  tensor([[95227.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1507063.1250, grad_fn=<MseLossBackward>)
output :  tensor([[173911.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1185818.8750, grad_fn=<MseLossBackward>)
output :  tensor([[274691.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0424e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141980.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(231180.6562, grad_fn=<MseLossBackward>)
output :  tensor([[158847.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1098140.2500, grad_fn=<MseLossBackward>)
output :  tensor([[135318.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(7942973.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150251.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(565457., grad_fn=<MseLossBackward>)
output :  tensor([[167183.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(513820.1562, grad_fn=<MseLossBackward>)
output :  tensor([[128221.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(1491623.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170587.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5470e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155815.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1402892.2500, grad_fn=<MseLossBackward>)
output :  tensor([[117152.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(425868.4062, grad_fn=<MseLossBackward>)
output :  tensor([[160892.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1995e+09, grad_fn=<MseLossBackward>)
output :  tensor([[53371.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1881398., grad_fn=<MseLossBackward>)
output :  tensor([[232957.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3271e+09, grad_fn=<MseLossBackward>)
output :  tensor([[198117.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(8308806., grad_fn=<MseLossBackward>)
output :  tensor([[189160.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(17310930., grad_fn=<MseLossBackward>)
output :  tensor([[106046.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2194.3369, grad_fn=<MseLossBackward>)
output :  tensor([[89029.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(4117126.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145708.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(32589292., grad_fn=<MseLossBackward>)
output :  tensor([[223178.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0157e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205546.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3816467.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164958.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1748.2852, grad_fn=<MseLossBackward>)
output :  tensor([[174258.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2340e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189328.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(450702.4375, grad_fn=<MseLossBackward>)
output :  tensor([[89664.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7097895., grad_fn=<MseLossBackward>)
output :  tensor([[138471.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2337554.2500, grad_fn=<MseLossBackward>)
output :  tensor([[106951.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(12594514., grad_fn=<MseLossBackward>)
output :  tensor([[147514.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3350e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173780.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8301e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192874.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4703e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178705.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1674557.3750, grad_fn=<MseLossBackward>)
output :  tensor([[98277.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3158617.5000, grad_fn=<MseLossBackward>)
output :  tensor([[117330.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(28889.3750, grad_fn=<MseLossBackward>)
output :  tensor([[162659.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5543e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202319.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5381530., grad_fn=<MseLossBackward>)
output :  tensor([[141482.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(6337806., grad_fn=<MseLossBackward>)
train_loss: [2.5629327e+09]
epoch_result tensor([0.])
output :  tensor([[157270.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1512285., grad_fn=<MseLossBackward>)
output :  tensor([[122079.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(6244.7036, grad_fn=<MseLossBackward>)
output :  tensor([[191266.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(8613308., grad_fn=<MseLossBackward>)
output :  tensor([[178601.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2563601.2500, grad_fn=<MseLossBackward>)
output :  tensor([[152029.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7448e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129912.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3656879.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139528.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2166094., grad_fn=<MseLossBackward>)
output :  tensor([[118575.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(180080.8750, grad_fn=<MseLossBackward>)
output :  tensor([[63913.2383]], grad_fn=<AddmmBackward>)
loss:  tensor(29303148., grad_fn=<MseLossBackward>)
output :  tensor([[167615.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2610446., grad_fn=<MseLossBackward>)
output :  tensor([[141113.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1238977.7500, grad_fn=<MseLossBackward>)
output :  tensor([[225969.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(940354.4375, grad_fn=<MseLossBackward>)
output :  tensor([[168983.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(286.8789, grad_fn=<MseLossBackward>)
output :  tensor([[247769.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3725503.2500, grad_fn=<MseLossBackward>)
output :  tensor([[56725.2539]], grad_fn=<AddmmBackward>)
loss:  tensor(2976501., grad_fn=<MseLossBackward>)
output :  tensor([[162099.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0973e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177631.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(6922736.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163798.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(53264452., grad_fn=<MseLossBackward>)
output :  tensor([[275989.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(978677.3750, grad_fn=<MseLossBackward>)
output :  tensor([[195742.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1581581.3750, grad_fn=<MseLossBackward>)
output :  tensor([[139539.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4507e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196072.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4811305., grad_fn=<MseLossBackward>)
output :  tensor([[180531.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9685e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152914.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3664951.2500, grad_fn=<MseLossBackward>)
output :  tensor([[177586.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(57557828., grad_fn=<MseLossBackward>)
output :  tensor([[87927.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(6388374.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170581.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3157e+09, grad_fn=<MseLossBackward>)
output :  tensor([[187291.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5249826.5000, grad_fn=<MseLossBackward>)
output :  tensor([[206936.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3584e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108960.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1080592.7500, grad_fn=<MseLossBackward>)
output :  tensor([[170469.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(281231.3438, grad_fn=<MseLossBackward>)
output :  tensor([[137385.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(783280.3125, grad_fn=<MseLossBackward>)
output :  tensor([[131255.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5089183.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121160.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(2758687.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146876.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(8.9259e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167164.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1855e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150347.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(419316.9688, grad_fn=<MseLossBackward>)
output :  tensor([[181911.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3654728.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143169.]], grad_fn=<AddmmBackward>)
loss:  tensor(4704561., grad_fn=<MseLossBackward>)
output :  tensor([[107675.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1243e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136519.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1591e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134721.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(77466.5469, grad_fn=<MseLossBackward>)
output :  tensor([[128990.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3962836.7500, grad_fn=<MseLossBackward>)
output :  tensor([[223041.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3836150.7500, grad_fn=<MseLossBackward>)
output :  tensor([[133059.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(654860.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145440.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(12670485., grad_fn=<MseLossBackward>)
output :  tensor([[115622.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(13121884., grad_fn=<MseLossBackward>)
output :  tensor([[161065.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1135723.1250, grad_fn=<MseLossBackward>)
output :  tensor([[147179.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2868e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195379.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(11421760., grad_fn=<MseLossBackward>)
output :  tensor([[135932.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2198455., grad_fn=<MseLossBackward>)
output :  tensor([[97385.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5913e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235082.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1172753.6250, grad_fn=<MseLossBackward>)
output :  tensor([[166378.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2195e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152892.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(37295832., grad_fn=<MseLossBackward>)
output :  tensor([[206024.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7714e+10, grad_fn=<MseLossBackward>)
output :  tensor([[248659.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1097e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145006.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2269401., grad_fn=<MseLossBackward>)
output :  tensor([[132912.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1181840.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153520.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2190353.7500, grad_fn=<MseLossBackward>)
output :  tensor([[133713.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(13791707., grad_fn=<MseLossBackward>)
output :  tensor([[180505.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3193e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178950.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(26518476., grad_fn=<MseLossBackward>)
output :  tensor([[163003.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2260277.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143441.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(195336.3750, grad_fn=<MseLossBackward>)
output :  tensor([[142950.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(202823.5625, grad_fn=<MseLossBackward>)
output :  tensor([[142129.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8239501., grad_fn=<MseLossBackward>)
output :  tensor([[173458.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3861e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194938.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8672e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138875.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5641738.5000, grad_fn=<MseLossBackward>)
output :  tensor([[173606.]], grad_fn=<AddmmBackward>)
loss:  tensor(2910436., grad_fn=<MseLossBackward>)
output :  tensor([[175895.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(26054166., grad_fn=<MseLossBackward>)
output :  tensor([[114240.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(576935.1875, grad_fn=<MseLossBackward>)
output :  tensor([[218586.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5824680.5000, grad_fn=<MseLossBackward>)
output :  tensor([[183292.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(42991.4297, grad_fn=<MseLossBackward>)
output :  tensor([[126366.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(750835.8125, grad_fn=<MseLossBackward>)
output :  tensor([[195995.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(254882.9844, grad_fn=<MseLossBackward>)
output :  tensor([[176694.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(3220398.5000, grad_fn=<MseLossBackward>)
output :  tensor([[212473.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0198e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209119.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3535986.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164678.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1342e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191161.]], grad_fn=<AddmmBackward>)
loss:  tensor(11148921., grad_fn=<MseLossBackward>)
output :  tensor([[113099.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(9862.9727, grad_fn=<MseLossBackward>)
output :  tensor([[114598.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4403768., grad_fn=<MseLossBackward>)
output :  tensor([[114711.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7350622.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146511.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(82998.0078, grad_fn=<MseLossBackward>)
output :  tensor([[159698.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3469e+10, grad_fn=<MseLossBackward>)
output :  tensor([[181489.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2218750., grad_fn=<MseLossBackward>)
output :  tensor([[126935.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(319207.3438, grad_fn=<MseLossBackward>)
output :  tensor([[144204.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(633342.3750, grad_fn=<MseLossBackward>)
output :  tensor([[182534.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2691e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119591.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(7243751.5000, grad_fn=<MseLossBackward>)
output :  tensor([[193386.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(13060205., grad_fn=<MseLossBackward>)
output :  tensor([[144571.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(183920.3594, grad_fn=<MseLossBackward>)
output :  tensor([[211560.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1793758., grad_fn=<MseLossBackward>)
output :  tensor([[125648.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(123640.1406, grad_fn=<MseLossBackward>)
output :  tensor([[245950.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5651392., grad_fn=<MseLossBackward>)
output :  tensor([[242535.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8032e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147078.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4582e+08, grad_fn=<MseLossBackward>)
output :  tensor([[86440.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4720e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194662.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4380e+09, grad_fn=<MseLossBackward>)
output :  tensor([[84220.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(10370513., grad_fn=<MseLossBackward>)
output :  tensor([[138727.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(596973.5625, grad_fn=<MseLossBackward>)
output :  tensor([[74649.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(722725.8125, grad_fn=<MseLossBackward>)
output :  tensor([[143796.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(711571.3125, grad_fn=<MseLossBackward>)
output :  tensor([[176409.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(167920.6719, grad_fn=<MseLossBackward>)
output :  tensor([[152058.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2076571.1250, grad_fn=<MseLossBackward>)
output :  tensor([[106872.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(278718., grad_fn=<MseLossBackward>)
output :  tensor([[205444.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2167e+10, grad_fn=<MseLossBackward>)
output :  tensor([[129691.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1420417., grad_fn=<MseLossBackward>)
output :  tensor([[268489.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3250e+08, grad_fn=<MseLossBackward>)
output :  tensor([[305957.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(16338775., grad_fn=<MseLossBackward>)
output :  tensor([[109586.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(4351494., grad_fn=<MseLossBackward>)
output :  tensor([[171224.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1625744.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134118.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8219e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149477.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0978e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129126.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1261620.3750, grad_fn=<MseLossBackward>)
output :  tensor([[132114.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(50623004., grad_fn=<MseLossBackward>)
output :  tensor([[135849.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9431e+08, grad_fn=<MseLossBackward>)
output :  tensor([[228170.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7959e+10, grad_fn=<MseLossBackward>)
output :  tensor([[192081.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2177e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145606.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2911715.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128724.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1499515., grad_fn=<MseLossBackward>)
output :  tensor([[117126.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(34531508., grad_fn=<MseLossBackward>)
output :  tensor([[258075.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5983e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134200.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(639575.0625, grad_fn=<MseLossBackward>)
output :  tensor([[200588.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(5815332., grad_fn=<MseLossBackward>)
output :  tensor([[99206.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(32413362., grad_fn=<MseLossBackward>)
output :  tensor([[139026.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(852361.6875, grad_fn=<MseLossBackward>)
output :  tensor([[209058.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3844e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178116.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3180426.5000, grad_fn=<MseLossBackward>)
output :  tensor([[185789.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(623137.5625, grad_fn=<MseLossBackward>)
output :  tensor([[163234.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1248e+10, grad_fn=<MseLossBackward>)
output :  tensor([[301406.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1285e+09, grad_fn=<MseLossBackward>)
output :  tensor([[198985.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1179328.1250, grad_fn=<MseLossBackward>)
output :  tensor([[260611.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0235e+10, grad_fn=<MseLossBackward>)
output :  tensor([[225842.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6126e+09, grad_fn=<MseLossBackward>)
output :  tensor([[285402.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9842e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225011.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1022373.7500, grad_fn=<MseLossBackward>)
output :  tensor([[222782.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8635e+10, grad_fn=<MseLossBackward>)
output :  tensor([[197484.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(234346.7656, grad_fn=<MseLossBackward>)
output :  tensor([[158034.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4300e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130241.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5100046., grad_fn=<MseLossBackward>)
output :  tensor([[134439.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1125654.7500, grad_fn=<MseLossBackward>)
output :  tensor([[90050.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(901342.5625, grad_fn=<MseLossBackward>)
output :  tensor([[105997.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4011946.5000, grad_fn=<MseLossBackward>)
output :  tensor([[275776.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8221e+09, grad_fn=<MseLossBackward>)
output :  tensor([[233992.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1015528.5625, grad_fn=<MseLossBackward>)
output :  tensor([[146447.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2095663.3750, grad_fn=<MseLossBackward>)
output :  tensor([[138106.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(367671.6875, grad_fn=<MseLossBackward>)
output :  tensor([[177972.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(17976276., grad_fn=<MseLossBackward>)
output :  tensor([[145515.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(70672.8984, grad_fn=<MseLossBackward>)
output :  tensor([[167025.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5486e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165373.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(139152.3125, grad_fn=<MseLossBackward>)
output :  tensor([[139271.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5160635., grad_fn=<MseLossBackward>)
output :  tensor([[188052.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2971e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116738.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(22450790., grad_fn=<MseLossBackward>)
output :  tensor([[180791.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(77298712., grad_fn=<MseLossBackward>)
output :  tensor([[115813.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(17525604., grad_fn=<MseLossBackward>)
output :  tensor([[87449.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(201825.5625, grad_fn=<MseLossBackward>)
output :  tensor([[179525.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(225165.0781, grad_fn=<MseLossBackward>)
output :  tensor([[110381.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(231902.4375, grad_fn=<MseLossBackward>)
output :  tensor([[238966.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1106.6018, grad_fn=<MseLossBackward>)
output :  tensor([[246103.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1218264., grad_fn=<MseLossBackward>)
output :  tensor([[127557.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(3772183.2500, grad_fn=<MseLossBackward>)
output :  tensor([[110497.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2365876.5000, grad_fn=<MseLossBackward>)
output :  tensor([[290157.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1608e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171919.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(175678.8594, grad_fn=<MseLossBackward>)
output :  tensor([[124543.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(208592.0156, grad_fn=<MseLossBackward>)
output :  tensor([[142775.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1384e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203572.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0873e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139363.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2678694.7500, grad_fn=<MseLossBackward>)
output :  tensor([[158234.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4827e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157262.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(11303359., grad_fn=<MseLossBackward>)
output :  tensor([[131073.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2476590.7500, grad_fn=<MseLossBackward>)
output :  tensor([[251282.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6184e+10, grad_fn=<MseLossBackward>)
output :  tensor([[400832.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1364078., grad_fn=<MseLossBackward>)
output :  tensor([[113634.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(21478010., grad_fn=<MseLossBackward>)
output :  tensor([[120469.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3880222.7500, grad_fn=<MseLossBackward>)
output :  tensor([[159472.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(739.1602, grad_fn=<MseLossBackward>)
output :  tensor([[128840.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3299e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163237.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4530e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173492.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0313e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103221.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(142925.3438, grad_fn=<MseLossBackward>)
output :  tensor([[139774.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1502539.6250, grad_fn=<MseLossBackward>)
output :  tensor([[364881.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5820307., grad_fn=<MseLossBackward>)
output :  tensor([[208368.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0822e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179404.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(15245486., grad_fn=<MseLossBackward>)
output :  tensor([[202207.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(479945.8750, grad_fn=<MseLossBackward>)
output :  tensor([[137366.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2667301.5000, grad_fn=<MseLossBackward>)
output :  tensor([[197470.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8824149., grad_fn=<MseLossBackward>)
output :  tensor([[133716.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8728e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178454.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6479729.5000, grad_fn=<MseLossBackward>)
output :  tensor([[238212.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(14344564., grad_fn=<MseLossBackward>)
output :  tensor([[173598.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(161478.4062, grad_fn=<MseLossBackward>)
output :  tensor([[106156.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3396937., grad_fn=<MseLossBackward>)
output :  tensor([[263762.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(637552.3750, grad_fn=<MseLossBackward>)
output :  tensor([[246682.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(11003940., grad_fn=<MseLossBackward>)
output :  tensor([[124287.2266]], grad_fn=<AddmmBackward>)
loss:  tensor(1656952.2500, grad_fn=<MseLossBackward>)
output :  tensor([[217320.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3270e+09, grad_fn=<MseLossBackward>)
output :  tensor([[304564.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2995e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206680.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(102000.3906, grad_fn=<MseLossBackward>)
output :  tensor([[215190.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5577e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161641.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(13999641., grad_fn=<MseLossBackward>)
output :  tensor([[171273.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1646369.6250, grad_fn=<MseLossBackward>)
output :  tensor([[162114.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(26862032., grad_fn=<MseLossBackward>)
output :  tensor([[170986.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(974107.3125, grad_fn=<MseLossBackward>)
output :  tensor([[240027.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8247e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226275.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(10113791., grad_fn=<MseLossBackward>)
output :  tensor([[159389.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5351e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125927.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(8569296., grad_fn=<MseLossBackward>)
output :  tensor([[179545.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6481002., grad_fn=<MseLossBackward>)
output :  tensor([[182594.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9917e+09, grad_fn=<MseLossBackward>)
output :  tensor([[212898.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3021e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134391.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1674.5999, grad_fn=<MseLossBackward>)
output :  tensor([[148736.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3636e+08, grad_fn=<MseLossBackward>)
output :  tensor([[277031.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1020.0039, grad_fn=<MseLossBackward>)
output :  tensor([[86958.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3834253.5000, grad_fn=<MseLossBackward>)
output :  tensor([[233880.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6863663., grad_fn=<MseLossBackward>)
output :  tensor([[262306.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0280e+11, grad_fn=<MseLossBackward>)
output :  tensor([[168040.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3840252.5000, grad_fn=<MseLossBackward>)
output :  tensor([[195937.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5259e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152989.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4042864.2500, grad_fn=<MseLossBackward>)
output :  tensor([[208362.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7992e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128481.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(268785.5312, grad_fn=<MseLossBackward>)
output :  tensor([[144139.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(740729.1875, grad_fn=<MseLossBackward>)
output :  tensor([[169167.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1115e+08, grad_fn=<MseLossBackward>)
output :  tensor([[187371.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2315770.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126377.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(142358.8281, grad_fn=<MseLossBackward>)
output :  tensor([[137975.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2177699.7500, grad_fn=<MseLossBackward>)
output :  tensor([[171802.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1434081.1250, grad_fn=<MseLossBackward>)
output :  tensor([[196152.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8995e+09, grad_fn=<MseLossBackward>)
output :  tensor([[243459.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(210924.9219, grad_fn=<MseLossBackward>)
output :  tensor([[155038.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1506.4102, grad_fn=<MseLossBackward>)
output :  tensor([[194457.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2378727.7500, grad_fn=<MseLossBackward>)
output :  tensor([[160114.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5967e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176485.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9089377., grad_fn=<MseLossBackward>)
output :  tensor([[181217.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1734900.6250, grad_fn=<MseLossBackward>)
output :  tensor([[101961.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(24620668., grad_fn=<MseLossBackward>)
output :  tensor([[172562.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1543e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132892.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4440897.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121090.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(37098852., grad_fn=<MseLossBackward>)
output :  tensor([[172812.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1410007.8750, grad_fn=<MseLossBackward>)
output :  tensor([[85953.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(909549.6250, grad_fn=<MseLossBackward>)
output :  tensor([[291641.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2693906.7500, grad_fn=<MseLossBackward>)
output :  tensor([[171928.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(48006712., grad_fn=<MseLossBackward>)
output :  tensor([[195027.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9083e+10, grad_fn=<MseLossBackward>)
output :  tensor([[249517.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6150e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149705.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1676863.1250, grad_fn=<MseLossBackward>)
output :  tensor([[125474.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2174795.5000, grad_fn=<MseLossBackward>)
output :  tensor([[115419.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(20079150., grad_fn=<MseLossBackward>)
output :  tensor([[143352.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0384e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174971.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(943690.8125, grad_fn=<MseLossBackward>)
output :  tensor([[111765.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5648e+08, grad_fn=<MseLossBackward>)
output :  tensor([[213146.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0994e+10, grad_fn=<MseLossBackward>)
output :  tensor([[244459.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8757253., grad_fn=<MseLossBackward>)
output :  tensor([[253009.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0216e+10, grad_fn=<MseLossBackward>)
output :  tensor([[220423.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4508e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196700.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4113e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190564.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9393555., grad_fn=<MseLossBackward>)
output :  tensor([[207560.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7223e+10, grad_fn=<MseLossBackward>)
output :  tensor([[188772.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1676e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180829.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4365031., grad_fn=<MseLossBackward>)
output :  tensor([[152448.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(201544.8750, grad_fn=<MseLossBackward>)
output :  tensor([[333634.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(11327011., grad_fn=<MseLossBackward>)
output :  tensor([[214820.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7953898., grad_fn=<MseLossBackward>)
output :  tensor([[161331.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1773350., grad_fn=<MseLossBackward>)
output :  tensor([[187379.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9290e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109969.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(24699968., grad_fn=<MseLossBackward>)
output :  tensor([[273457.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9266e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170103.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(14412345., grad_fn=<MseLossBackward>)
output :  tensor([[212840.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(434981.4688, grad_fn=<MseLossBackward>)
output :  tensor([[216651.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(18905920., grad_fn=<MseLossBackward>)
output :  tensor([[180869.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2787126., grad_fn=<MseLossBackward>)
output :  tensor([[204227.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5891239., grad_fn=<MseLossBackward>)
output :  tensor([[157221.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4934229., grad_fn=<MseLossBackward>)
output :  tensor([[146750.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1856e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119719.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1487294.6250, grad_fn=<MseLossBackward>)
output :  tensor([[139594.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(164569.6719, grad_fn=<MseLossBackward>)
output :  tensor([[147505.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2234044., grad_fn=<MseLossBackward>)
output :  tensor([[201817.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5922e+10, grad_fn=<MseLossBackward>)
output :  tensor([[162027.]], grad_fn=<AddmmBackward>)
loss:  tensor(6385729., grad_fn=<MseLossBackward>)
output :  tensor([[99294.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(42230.2500, grad_fn=<MseLossBackward>)
output :  tensor([[226789.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7452e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186194.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2827e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174818.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2776909.7500, grad_fn=<MseLossBackward>)
output :  tensor([[84108.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(4444224., grad_fn=<MseLossBackward>)
output :  tensor([[130236.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3015269.5000, grad_fn=<MseLossBackward>)
output :  tensor([[216902.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8425595., grad_fn=<MseLossBackward>)
output :  tensor([[144502.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(252333.5469, grad_fn=<MseLossBackward>)
output :  tensor([[133678.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(13529408., grad_fn=<MseLossBackward>)
output :  tensor([[143629.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1059484.2500, grad_fn=<MseLossBackward>)
output :  tensor([[175302.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4291e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144692.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(478885.6250, grad_fn=<MseLossBackward>)
output :  tensor([[159974.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(671.9436, grad_fn=<MseLossBackward>)
output :  tensor([[213368.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2661792.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134082.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4582e+08, grad_fn=<MseLossBackward>)
output :  tensor([[255165.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(27307.5625, grad_fn=<MseLossBackward>)
output :  tensor([[160919.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2016222.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130512.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(4049810.2500, grad_fn=<MseLossBackward>)
output :  tensor([[94640.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(129116.7031, grad_fn=<MseLossBackward>)
output :  tensor([[151502.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4894e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176951.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8693099., grad_fn=<MseLossBackward>)
output :  tensor([[120374.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(15775.7529, grad_fn=<MseLossBackward>)
output :  tensor([[189520.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5547e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143743.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1273e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148860.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1079683.3750, grad_fn=<MseLossBackward>)
output :  tensor([[187612.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(18846.1406, grad_fn=<MseLossBackward>)
output :  tensor([[253063.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6011e+09, grad_fn=<MseLossBackward>)
output :  tensor([[92274.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(599523.5625, grad_fn=<MseLossBackward>)
output :  tensor([[235934.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(16530831., grad_fn=<MseLossBackward>)
output :  tensor([[131734.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(10461485., grad_fn=<MseLossBackward>)
output :  tensor([[165088.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0163e+10, grad_fn=<MseLossBackward>)
output :  tensor([[113281.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7639e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176100.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(10097.1094, grad_fn=<MseLossBackward>)
output :  tensor([[163494.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8052e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154360.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6935e+08, grad_fn=<MseLossBackward>)
output :  tensor([[233159.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(34114908., grad_fn=<MseLossBackward>)
output :  tensor([[225593.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0502e+09, grad_fn=<MseLossBackward>)
output :  tensor([[125957.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(1086431.6250, grad_fn=<MseLossBackward>)
output :  tensor([[125358.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(411021.2188, grad_fn=<MseLossBackward>)
output :  tensor([[226917.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6754.7852, grad_fn=<MseLossBackward>)
output :  tensor([[229480.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(20425174., grad_fn=<MseLossBackward>)
output :  tensor([[224871.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3344155., grad_fn=<MseLossBackward>)
output :  tensor([[149284.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1650542.3750, grad_fn=<MseLossBackward>)
output :  tensor([[206124.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(15017199., grad_fn=<MseLossBackward>)
output :  tensor([[128892.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(79072944., grad_fn=<MseLossBackward>)
output :  tensor([[136604.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(16846664., grad_fn=<MseLossBackward>)
output :  tensor([[310964.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(16283495., grad_fn=<MseLossBackward>)
output :  tensor([[141288.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(83142.1172, grad_fn=<MseLossBackward>)
output :  tensor([[121483.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9684e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108537.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(926045.3750, grad_fn=<MseLossBackward>)
output :  tensor([[157523.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2430e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181804.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6343e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172127.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(761310.8125, grad_fn=<MseLossBackward>)
output :  tensor([[193820.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(51548812., grad_fn=<MseLossBackward>)
output :  tensor([[103650.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(13323755., grad_fn=<MseLossBackward>)
output :  tensor([[178924.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5636.7246, grad_fn=<MseLossBackward>)
output :  tensor([[169995.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4390465.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137594.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1975474.1250, grad_fn=<MseLossBackward>)
output :  tensor([[265565.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7487e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142565.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3137e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171882.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1249050.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142483.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6167074., grad_fn=<MseLossBackward>)
output :  tensor([[200745.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(60132.2344, grad_fn=<MseLossBackward>)
output :  tensor([[167438.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6563684., grad_fn=<MseLossBackward>)
output :  tensor([[244025.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(670.3245, grad_fn=<MseLossBackward>)
output :  tensor([[136197.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2880498.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151068.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2954692.5000, grad_fn=<MseLossBackward>)
output :  tensor([[215072.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5319.8789, grad_fn=<MseLossBackward>)
output :  tensor([[164054.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(893290.8125, grad_fn=<MseLossBackward>)
output :  tensor([[191227.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4961756., grad_fn=<MseLossBackward>)
output :  tensor([[129986.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4177e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127355.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2703763.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140952.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(907970.7500, grad_fn=<MseLossBackward>)
output :  tensor([[204223.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2610e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167574.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7641e+09, grad_fn=<MseLossBackward>)
output :  tensor([[73865.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9225e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92600.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(65625820., grad_fn=<MseLossBackward>)
output :  tensor([[257261.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(15752465., grad_fn=<MseLossBackward>)
output :  tensor([[203646.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1792e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113793.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(1454530.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155569.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0195e+09, grad_fn=<MseLossBackward>)
output :  tensor([[209639.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0733e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181873.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7664e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159977.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(24777684., grad_fn=<MseLossBackward>)
output :  tensor([[166141.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(14885490., grad_fn=<MseLossBackward>)
output :  tensor([[117580.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6657206.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158951.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(15610895., grad_fn=<MseLossBackward>)
output :  tensor([[193605.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7674e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220885.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1920606.2500, grad_fn=<MseLossBackward>)
output :  tensor([[248261.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4675e+11, grad_fn=<MseLossBackward>)
output :  tensor([[144960.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4160070.2500, grad_fn=<MseLossBackward>)
output :  tensor([[110212.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(3000987.7500, grad_fn=<MseLossBackward>)
output :  tensor([[171566.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0678e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144632.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(34432872., grad_fn=<MseLossBackward>)
output :  tensor([[233018.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(15851845., grad_fn=<MseLossBackward>)
output :  tensor([[115571.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(326871.2500, grad_fn=<MseLossBackward>)
output :  tensor([[183273.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(139572.2969, grad_fn=<MseLossBackward>)
output :  tensor([[185389.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1717123.6250, grad_fn=<MseLossBackward>)
output :  tensor([[165763.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3789e+10, grad_fn=<MseLossBackward>)
output :  tensor([[98139.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9375e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235633.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(11336058., grad_fn=<MseLossBackward>)
output :  tensor([[178713.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7365711., grad_fn=<MseLossBackward>)
output :  tensor([[142234.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(4994666.5000, grad_fn=<MseLossBackward>)
output :  tensor([[238574.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(12775151., grad_fn=<MseLossBackward>)
output :  tensor([[157372.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(31673152., grad_fn=<MseLossBackward>)
output :  tensor([[206516.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4038e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135271.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(73678.3125, grad_fn=<MseLossBackward>)
output :  tensor([[187885.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7006e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134130.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3496023.5000, grad_fn=<MseLossBackward>)
output :  tensor([[229069.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(48034644., grad_fn=<MseLossBackward>)
output :  tensor([[226631.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4609e+08, grad_fn=<MseLossBackward>)
output :  tensor([[88491.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2274676.7500, grad_fn=<MseLossBackward>)
output :  tensor([[158444.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(980038.1250, grad_fn=<MseLossBackward>)
output :  tensor([[247805.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5147e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147289.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5241738.5000, grad_fn=<MseLossBackward>)
output :  tensor([[108147.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6931e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163839.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(435806.2812, grad_fn=<MseLossBackward>)
output :  tensor([[145033.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1067863.8750, grad_fn=<MseLossBackward>)
output :  tensor([[129221.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(1044276.4375, grad_fn=<MseLossBackward>)
output :  tensor([[188702.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9417e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123226.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(528097.4375, grad_fn=<MseLossBackward>)
output :  tensor([[149351.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(7013476.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169163.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6689012.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151064.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4222.9688, grad_fn=<MseLossBackward>)
output :  tensor([[158347.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(20725968., grad_fn=<MseLossBackward>)
output :  tensor([[137190.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9470e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132277.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(76971.5625, grad_fn=<MseLossBackward>)
output :  tensor([[154366.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3612e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147301.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9921811., grad_fn=<MseLossBackward>)
output :  tensor([[160209.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2374344., grad_fn=<MseLossBackward>)
output :  tensor([[135440.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5233e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150453.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2734682.2500, grad_fn=<MseLossBackward>)
output :  tensor([[184678.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(11033608., grad_fn=<MseLossBackward>)
output :  tensor([[171664.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7098561., grad_fn=<MseLossBackward>)
output :  tensor([[182322.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5391901.5000, grad_fn=<MseLossBackward>)
output :  tensor([[219173.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(683412.2500, grad_fn=<MseLossBackward>)
output :  tensor([[110642.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7522763.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134084.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(84347864., grad_fn=<MseLossBackward>)
output :  tensor([[284289.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2924207., grad_fn=<MseLossBackward>)
output :  tensor([[116982.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(965843.6250, grad_fn=<MseLossBackward>)
output :  tensor([[179653.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6278e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182539.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(6053060.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182887.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6824258., grad_fn=<MseLossBackward>)
output :  tensor([[250707.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9010e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219823.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4738580.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122087.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6203e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172814.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9263e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122930.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(1144348.3750, grad_fn=<MseLossBackward>)
output :  tensor([[183336.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5251e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151530.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2160348.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153399.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(47609136., grad_fn=<MseLossBackward>)
output :  tensor([[203608.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7246611.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145730.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7504e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175915.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(7203.7656, grad_fn=<MseLossBackward>)
output :  tensor([[255390.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8126e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147534.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(216384.8750, grad_fn=<MseLossBackward>)
output :  tensor([[200146.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6343236., grad_fn=<MseLossBackward>)
output :  tensor([[160737.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(619516.5625, grad_fn=<MseLossBackward>)
output :  tensor([[122249.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1730e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134032.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2950343., grad_fn=<MseLossBackward>)
output :  tensor([[179711.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(18390562., grad_fn=<MseLossBackward>)
output :  tensor([[196079.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(36962220., grad_fn=<MseLossBackward>)
output :  tensor([[232493.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1930e+09, grad_fn=<MseLossBackward>)
output :  tensor([[254142.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(8163788.5000, grad_fn=<MseLossBackward>)
output :  tensor([[189666.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6727e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143986.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7548e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139971.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(20504340., grad_fn=<MseLossBackward>)
output :  tensor([[71613.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9941e+08, grad_fn=<MseLossBackward>)
output :  tensor([[142854.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(61700288., grad_fn=<MseLossBackward>)
output :  tensor([[130145.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(1551951.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154314.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(98772.7031, grad_fn=<MseLossBackward>)
output :  tensor([[126227.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(596297.6875, grad_fn=<MseLossBackward>)
output :  tensor([[78387.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(3561270.2500, grad_fn=<MseLossBackward>)
output :  tensor([[83602.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2568907.7500, grad_fn=<MseLossBackward>)
output :  tensor([[227799.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(17643412., grad_fn=<MseLossBackward>)
output :  tensor([[140597.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8946e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134111.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(13039434., grad_fn=<MseLossBackward>)
output :  tensor([[169791.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7791251., grad_fn=<MseLossBackward>)
output :  tensor([[236643.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2700476., grad_fn=<MseLossBackward>)
output :  tensor([[186828.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(28209708., grad_fn=<MseLossBackward>)
output :  tensor([[157207.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1458735.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198911.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1022310.5625, grad_fn=<MseLossBackward>)
output :  tensor([[204864.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0327e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137155.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(24185.1094, grad_fn=<MseLossBackward>)
output :  tensor([[154672.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(107164.1641, grad_fn=<MseLossBackward>)
output :  tensor([[135589.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(168202.5156, grad_fn=<MseLossBackward>)
output :  tensor([[201767.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9707e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154467.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(218205.7656, grad_fn=<MseLossBackward>)
output :  tensor([[135185.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7377e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146063.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1352968.7500, grad_fn=<MseLossBackward>)
output :  tensor([[212719.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(517725.2188, grad_fn=<MseLossBackward>)
output :  tensor([[99060.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9105e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166896.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(363948.2812, grad_fn=<MseLossBackward>)
output :  tensor([[130855.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(8156691.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147370.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(137525.0938, grad_fn=<MseLossBackward>)
output :  tensor([[105045.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8201e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139314.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3293034., grad_fn=<MseLossBackward>)
output :  tensor([[238481.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6156756.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144264.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(541236.1250, grad_fn=<MseLossBackward>)
output :  tensor([[138476.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(953155.5625, grad_fn=<MseLossBackward>)
output :  tensor([[163071.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2300e+09, grad_fn=<MseLossBackward>)
output :  tensor([[272428.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(31037434., grad_fn=<MseLossBackward>)
output :  tensor([[170705.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(18440180., grad_fn=<MseLossBackward>)
output :  tensor([[104198.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(2024417.6250, grad_fn=<MseLossBackward>)
output :  tensor([[202641.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6037e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158176.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(677483.3125, grad_fn=<MseLossBackward>)
output :  tensor([[165059.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5099e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97446.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(728128.8750, grad_fn=<MseLossBackward>)
output :  tensor([[122527.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(1149502.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156136.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(18581.0977, grad_fn=<MseLossBackward>)
output :  tensor([[142790.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7789506.5000, grad_fn=<MseLossBackward>)
output :  tensor([[201468.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2155161.7500, grad_fn=<MseLossBackward>)
output :  tensor([[143323.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1751735., grad_fn=<MseLossBackward>)
output :  tensor([[268247.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(35612920., grad_fn=<MseLossBackward>)
output :  tensor([[128013.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2259e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165637.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(18944.9414, grad_fn=<MseLossBackward>)
output :  tensor([[188458.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1756.1338, grad_fn=<MseLossBackward>)
output :  tensor([[124230.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0251e+08, grad_fn=<MseLossBackward>)
output :  tensor([[250717.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(515389.3750, grad_fn=<MseLossBackward>)
output :  tensor([[159783.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4071e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243762.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2519164.2500, grad_fn=<MseLossBackward>)
output :  tensor([[147538.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(12521314., grad_fn=<MseLossBackward>)
output :  tensor([[210634.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(402173.9688, grad_fn=<MseLossBackward>)
output :  tensor([[172749.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(122117.4844, grad_fn=<MseLossBackward>)
output :  tensor([[156124.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4511973.5000, grad_fn=<MseLossBackward>)
output :  tensor([[119044.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1090523.3750, grad_fn=<MseLossBackward>)
output :  tensor([[240471.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1733e+09, grad_fn=<MseLossBackward>)
output :  tensor([[241157.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1340095.6250, grad_fn=<MseLossBackward>)
output :  tensor([[153413.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5783.1270, grad_fn=<MseLossBackward>)
output :  tensor([[254826.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5406.8447, grad_fn=<MseLossBackward>)
output :  tensor([[123311.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(77575080., grad_fn=<MseLossBackward>)
output :  tensor([[176280.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(78575.0938, grad_fn=<MseLossBackward>)
output :  tensor([[160474.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(224809.3281, grad_fn=<MseLossBackward>)
output :  tensor([[129828.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(1373455.8750, grad_fn=<MseLossBackward>)
output :  tensor([[191011.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7836e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164921.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(849623.0625, grad_fn=<MseLossBackward>)
output :  tensor([[165141.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4584684., grad_fn=<MseLossBackward>)
output :  tensor([[158333.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(110982.6797, grad_fn=<MseLossBackward>)
output :  tensor([[147881.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4073333., grad_fn=<MseLossBackward>)
output :  tensor([[170968.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7784e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158994.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1011627.3750, grad_fn=<MseLossBackward>)
output :  tensor([[380872.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(9593538., grad_fn=<MseLossBackward>)
output :  tensor([[128550.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2403178.2500, grad_fn=<MseLossBackward>)
output :  tensor([[130677.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0410e+09, grad_fn=<MseLossBackward>)
output :  tensor([[283380.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4698327., grad_fn=<MseLossBackward>)
output :  tensor([[161521.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(228723.0625, grad_fn=<MseLossBackward>)
output :  tensor([[131352.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1779e+08, grad_fn=<MseLossBackward>)
output :  tensor([[232969.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(939233.5625, grad_fn=<MseLossBackward>)
output :  tensor([[179781.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(516040.1875, grad_fn=<MseLossBackward>)
output :  tensor([[152443.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(197108.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143943.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1117216., grad_fn=<MseLossBackward>)
output :  tensor([[155459.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4447e+08, grad_fn=<MseLossBackward>)
output :  tensor([[101952.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(3813202., grad_fn=<MseLossBackward>)
output :  tensor([[70868.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1813e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164451.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(300338.2500, grad_fn=<MseLossBackward>)
output :  tensor([[191752.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3139e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156299.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2891647., grad_fn=<MseLossBackward>)
output :  tensor([[151202.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(39653784., grad_fn=<MseLossBackward>)
output :  tensor([[134675.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7695249.5000, grad_fn=<MseLossBackward>)
output :  tensor([[205949.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(0.0088, grad_fn=<MseLossBackward>)
output :  tensor([[138609.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(371223.6562, grad_fn=<MseLossBackward>)
output :  tensor([[181687.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6464e+10, grad_fn=<MseLossBackward>)
output :  tensor([[149010.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9063392., grad_fn=<MseLossBackward>)
output :  tensor([[112638.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7843e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91268.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(7458745., grad_fn=<MseLossBackward>)
output :  tensor([[173515.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2204204.2500, grad_fn=<MseLossBackward>)
output :  tensor([[266987.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(43389804., grad_fn=<MseLossBackward>)
output :  tensor([[139164.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5456020., grad_fn=<MseLossBackward>)
output :  tensor([[157574.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(5386243., grad_fn=<MseLossBackward>)
output :  tensor([[132065.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(189116.2656, grad_fn=<MseLossBackward>)
output :  tensor([[145899.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(12967088., grad_fn=<MseLossBackward>)
output :  tensor([[168637.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(543837.1250, grad_fn=<MseLossBackward>)
output :  tensor([[124043.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(8739322., grad_fn=<MseLossBackward>)
output :  tensor([[171371.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9544e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158200.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1441312.7500, grad_fn=<MseLossBackward>)
output :  tensor([[116210.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(83624.8906, grad_fn=<MseLossBackward>)
output :  tensor([[161172.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1592e+09, grad_fn=<MseLossBackward>)
output :  tensor([[52832.6680]], grad_fn=<AddmmBackward>)
loss:  tensor(693335.9375, grad_fn=<MseLossBackward>)
output :  tensor([[232582.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3868e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200392.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(368695.6250, grad_fn=<MseLossBackward>)
output :  tensor([[182696.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5304960.5000, grad_fn=<MseLossBackward>)
output :  tensor([[104946.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1109533., grad_fn=<MseLossBackward>)
output :  tensor([[91350.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(18923928., grad_fn=<MseLossBackward>)
output :  tensor([[140624.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(390312.5625, grad_fn=<MseLossBackward>)
output :  tensor([[224720.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7996e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205679.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3315984., grad_fn=<MseLossBackward>)
output :  tensor([[166639.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2686782., grad_fn=<MseLossBackward>)
output :  tensor([[175431.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0226e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191002.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1004129.2500, grad_fn=<MseLossBackward>)
output :  tensor([[89407.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5796282., grad_fn=<MseLossBackward>)
output :  tensor([[140395.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(156766.5000, grad_fn=<MseLossBackward>)
output :  tensor([[108825.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2804997., grad_fn=<MseLossBackward>)
output :  tensor([[144417.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(71521904., grad_fn=<MseLossBackward>)
output :  tensor([[171855.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6692e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195787.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(84869872., grad_fn=<MseLossBackward>)
output :  tensor([[180965.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(932612.6875, grad_fn=<MseLossBackward>)
output :  tensor([[97913.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1998070.6250, grad_fn=<MseLossBackward>)
output :  tensor([[120213.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(7362870.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161345.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1321e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197900.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4405932., grad_fn=<MseLossBackward>)
output :  tensor([[143103.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(804020.4375, grad_fn=<MseLossBackward>)
train_loss: [2.5474002e+09]
epoch_result tensor([0.])
output :  tensor([[163138.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(21519596., grad_fn=<MseLossBackward>)
output :  tensor([[122707.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(499904.2500, grad_fn=<MseLossBackward>)
output :  tensor([[197972.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(14225862., grad_fn=<MseLossBackward>)
output :  tensor([[177714.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(510041.4688, grad_fn=<MseLossBackward>)
output :  tensor([[152613.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4448e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125083.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(8505152., grad_fn=<MseLossBackward>)
output :  tensor([[144551.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(12610489., grad_fn=<MseLossBackward>)
output :  tensor([[119819.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(671759.5000, grad_fn=<MseLossBackward>)
output :  tensor([[64954.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(41664100., grad_fn=<MseLossBackward>)
output :  tensor([[167421.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2020617.8750, grad_fn=<MseLossBackward>)
output :  tensor([[134984.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(25156180., grad_fn=<MseLossBackward>)
output :  tensor([[225769.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(592226.4375, grad_fn=<MseLossBackward>)
output :  tensor([[165565.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(11796864., grad_fn=<MseLossBackward>)
output :  tensor([[246589.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9674044., grad_fn=<MseLossBackward>)
output :  tensor([[55337.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(114043.3984, grad_fn=<MseLossBackward>)
output :  tensor([[159815.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3457e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168205.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(46159924., grad_fn=<MseLossBackward>)
output :  tensor([[164014.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(56472172., grad_fn=<MseLossBackward>)
output :  tensor([[272476.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(6366002., grad_fn=<MseLossBackward>)
output :  tensor([[195598.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1964070.8750, grad_fn=<MseLossBackward>)
output :  tensor([[139051.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4774e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193796.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6777.9199, grad_fn=<MseLossBackward>)
output :  tensor([[179422.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0682e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151521.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(271717.8438, grad_fn=<MseLossBackward>)
output :  tensor([[174238.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(17967664., grad_fn=<MseLossBackward>)
output :  tensor([[88292.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(8367596., grad_fn=<MseLossBackward>)
output :  tensor([[171164.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3831e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183459.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2373910.5000, grad_fn=<MseLossBackward>)
output :  tensor([[208881.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1733e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113971.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(15773495., grad_fn=<MseLossBackward>)
output :  tensor([[172029.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1060642.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138012.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2289074.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130851.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(3429180.5000, grad_fn=<MseLossBackward>)
output :  tensor([[119765.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(70540.0391, grad_fn=<MseLossBackward>)
output :  tensor([[143611.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0815e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167887.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1642e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150514.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(663970.3125, grad_fn=<MseLossBackward>)
output :  tensor([[180400.]], grad_fn=<AddmmBackward>)
loss:  tensor(160000., grad_fn=<MseLossBackward>)
output :  tensor([[141809.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(655897.5000, grad_fn=<MseLossBackward>)
output :  tensor([[103230.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7504e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134635.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4585e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139392.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(19295154., grad_fn=<MseLossBackward>)
output :  tensor([[128484.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2204436.2500, grad_fn=<MseLossBackward>)
output :  tensor([[227028.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4115763.2500, grad_fn=<MseLossBackward>)
output :  tensor([[131762.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(238083., grad_fn=<MseLossBackward>)
output :  tensor([[150011.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1022247.3750, grad_fn=<MseLossBackward>)
output :  tensor([[113175.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(1381488., grad_fn=<MseLossBackward>)
output :  tensor([[157175.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7979389., grad_fn=<MseLossBackward>)
output :  tensor([[143602.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6417e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190123.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3522777., grad_fn=<MseLossBackward>)
output :  tensor([[133397.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1108578.6250, grad_fn=<MseLossBackward>)
output :  tensor([[106308.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(13624923., grad_fn=<MseLossBackward>)
output :  tensor([[231138.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(8187109., grad_fn=<MseLossBackward>)
output :  tensor([[167776.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0897e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164119.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(26204960., grad_fn=<MseLossBackward>)
output :  tensor([[201225.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9335e+10, grad_fn=<MseLossBackward>)
output :  tensor([[248677.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1093e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141968.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2346306., grad_fn=<MseLossBackward>)
output :  tensor([[135737.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3019883.7500, grad_fn=<MseLossBackward>)
output :  tensor([[155647.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(419782.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135321.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(28315368., grad_fn=<MseLossBackward>)
output :  tensor([[180133.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3787e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181681.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5848689., grad_fn=<MseLossBackward>)
output :  tensor([[158787.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7358843., grad_fn=<MseLossBackward>)
output :  tensor([[133250.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(95060976., grad_fn=<MseLossBackward>)
output :  tensor([[141969.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(281629.2188, grad_fn=<MseLossBackward>)
output :  tensor([[149563.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(20828528., grad_fn=<MseLossBackward>)
output :  tensor([[175649.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1006e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196760.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0965e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136995.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(245969.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169305.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6732241., grad_fn=<MseLossBackward>)
output :  tensor([[178239.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7619670., grad_fn=<MseLossBackward>)
output :  tensor([[115842.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(709214., grad_fn=<MseLossBackward>)
output :  tensor([[224145.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(9895645., grad_fn=<MseLossBackward>)
output :  tensor([[190304.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(46297180., grad_fn=<MseLossBackward>)
output :  tensor([[124908.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(349761.3438, grad_fn=<MseLossBackward>)
output :  tensor([[195499.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1001656.9375, grad_fn=<MseLossBackward>)
output :  tensor([[169556.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(28554830., grad_fn=<MseLossBackward>)
output :  tensor([[213396.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9878e+10, grad_fn=<MseLossBackward>)
output :  tensor([[207987.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(9076380., grad_fn=<MseLossBackward>)
output :  tensor([[164003.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0893e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191720.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7726662.5000, grad_fn=<MseLossBackward>)
output :  tensor([[112244.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(570721.2500, grad_fn=<MseLossBackward>)
output :  tensor([[112730.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(53079.8398, grad_fn=<MseLossBackward>)
output :  tensor([[112795.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(632397.6875, grad_fn=<MseLossBackward>)
output :  tensor([[147439.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(408780.4062, grad_fn=<MseLossBackward>)
output :  tensor([[162240.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2545e+10, grad_fn=<MseLossBackward>)
output :  tensor([[178019.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3921452., grad_fn=<MseLossBackward>)
output :  tensor([[128876.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(1896107.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146937.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3753724.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180800.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1069e+09, grad_fn=<MseLossBackward>)
output :  tensor([[119031.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(4541660.5000, grad_fn=<MseLossBackward>)
output :  tensor([[196593.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(165432.8594, grad_fn=<MseLossBackward>)
output :  tensor([[147076.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4312566., grad_fn=<MseLossBackward>)
output :  tensor([[213390.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(240268.4688, grad_fn=<MseLossBackward>)
output :  tensor([[126901.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(811857.3125, grad_fn=<MseLossBackward>)
output :  tensor([[248189.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(19117.3828, grad_fn=<MseLossBackward>)
output :  tensor([[239936.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0307e+09, grad_fn=<MseLossBackward>)
output :  tensor([[147695.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6556e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85852.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1763e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197918.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9261e+09, grad_fn=<MseLossBackward>)
output :  tensor([[80093.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(821359.8750, grad_fn=<MseLossBackward>)
output :  tensor([[140672.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1374060.1250, grad_fn=<MseLossBackward>)
output :  tensor([[76451.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(904727.9375, grad_fn=<MseLossBackward>)
output :  tensor([[145407.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6025721., grad_fn=<MseLossBackward>)
output :  tensor([[176052.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2759.5322, grad_fn=<MseLossBackward>)
output :  tensor([[154823.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1751280., grad_fn=<MseLossBackward>)
output :  tensor([[110641.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(10510209., grad_fn=<MseLossBackward>)
output :  tensor([[206859.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1857e+10, grad_fn=<MseLossBackward>)
output :  tensor([[126746.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(3076433.7500, grad_fn=<MseLossBackward>)
output :  tensor([[269506.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1011e+08, grad_fn=<MseLossBackward>)
output :  tensor([[303812.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(38283996., grad_fn=<MseLossBackward>)
output :  tensor([[108399.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(809943.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169780.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7393895.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135002.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2911e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140445.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2089018.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130587.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(114148.9609, grad_fn=<MseLossBackward>)
output :  tensor([[126277.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1632285.7500, grad_fn=<MseLossBackward>)
output :  tensor([[133599.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8079e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224829.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9271e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194502.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1461e+10, grad_fn=<MseLossBackward>)
output :  tensor([[140077.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(14614373., grad_fn=<MseLossBackward>)
output :  tensor([[127305.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(37787.7148, grad_fn=<MseLossBackward>)
output :  tensor([[111413.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(26885.7500, grad_fn=<MseLossBackward>)
output :  tensor([[255132.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9600e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137488.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6193099., grad_fn=<MseLossBackward>)
output :  tensor([[199647.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(11240409., grad_fn=<MseLossBackward>)
output :  tensor([[107986.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(9526193., grad_fn=<MseLossBackward>)
output :  tensor([[139525.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(180399.2969, grad_fn=<MseLossBackward>)
output :  tensor([[208702.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4957e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175840.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(16481063., grad_fn=<MseLossBackward>)
output :  tensor([[184389.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(372176.2500, grad_fn=<MseLossBackward>)
output :  tensor([[163707.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1110e+10, grad_fn=<MseLossBackward>)
output :  tensor([[306347.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2096e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196075.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3329826.5000, grad_fn=<MseLossBackward>)
output :  tensor([[257164.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1228e+10, grad_fn=<MseLossBackward>)
output :  tensor([[226281.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5775e+09, grad_fn=<MseLossBackward>)
output :  tensor([[291096.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7098e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224428.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(183585.4688, grad_fn=<MseLossBackward>)
output :  tensor([[224648.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8006e+10, grad_fn=<MseLossBackward>)
output :  tensor([[200268.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(10685033., grad_fn=<MseLossBackward>)
output :  tensor([[158395.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6409e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138812.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(39842528., grad_fn=<MseLossBackward>)
output :  tensor([[136683.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1401264., grad_fn=<MseLossBackward>)
output :  tensor([[92130.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1278630.8750, grad_fn=<MseLossBackward>)
output :  tensor([[110164.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(4683538.5000, grad_fn=<MseLossBackward>)
output :  tensor([[272292.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2044e+09, grad_fn=<MseLossBackward>)
output :  tensor([[230360.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(21525106., grad_fn=<MseLossBackward>)
output :  tensor([[147173.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4725461., grad_fn=<MseLossBackward>)
output :  tensor([[137420.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6278.0859, grad_fn=<MseLossBackward>)
output :  tensor([[174463.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(533356.3750, grad_fn=<MseLossBackward>)
output :  tensor([[143867.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1910960.6250, grad_fn=<MseLossBackward>)
output :  tensor([[164389.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0665e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163591.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1985060.8750, grad_fn=<MseLossBackward>)
output :  tensor([[135416.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2506482.7500, grad_fn=<MseLossBackward>)
output :  tensor([[189164.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4441e+09, grad_fn=<MseLossBackward>)
output :  tensor([[112125.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(15711.0557, grad_fn=<MseLossBackward>)
output :  tensor([[170864.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1288615.1250, grad_fn=<MseLossBackward>)
output :  tensor([[123123.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(9754642., grad_fn=<MseLossBackward>)
output :  tensor([[87757.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(573995.6250, grad_fn=<MseLossBackward>)
output :  tensor([[179585.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(171745.4844, grad_fn=<MseLossBackward>)
output :  tensor([[108547.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1830059.3750, grad_fn=<MseLossBackward>)
output :  tensor([[236529.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6102289.5000, grad_fn=<MseLossBackward>)
output :  tensor([[242863.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4564966., grad_fn=<MseLossBackward>)
output :  tensor([[132490.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8941595., grad_fn=<MseLossBackward>)
output :  tensor([[107106.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3433551., grad_fn=<MseLossBackward>)
output :  tensor([[288467.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2108e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170189.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1717205.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126606.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2580641.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143008.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2541e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204202.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(95985800., grad_fn=<MseLossBackward>)
output :  tensor([[143390.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5714042., grad_fn=<MseLossBackward>)
output :  tensor([[158971.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4648e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152367.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2347072., grad_fn=<MseLossBackward>)
output :  tensor([[129909.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(167882.2656, grad_fn=<MseLossBackward>)
output :  tensor([[248582.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6878e+10, grad_fn=<MseLossBackward>)
output :  tensor([[395325.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(44552288., grad_fn=<MseLossBackward>)
output :  tensor([[105313.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(13593162., grad_fn=<MseLossBackward>)
output :  tensor([[110099.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(70573520., grad_fn=<MseLossBackward>)
output :  tensor([[158268.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1517747., grad_fn=<MseLossBackward>)
output :  tensor([[130426.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5571e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163781.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3894e+09, grad_fn=<MseLossBackward>)
output :  tensor([[170359.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6433e+09, grad_fn=<MseLossBackward>)
output :  tensor([[106635.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(9217201., grad_fn=<MseLossBackward>)
output :  tensor([[140805.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(37830.2500, grad_fn=<MseLossBackward>)
output :  tensor([[367421.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(16328.0479, grad_fn=<MseLossBackward>)
output :  tensor([[208958.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0288e+09, grad_fn=<MseLossBackward>)
output :  tensor([[175782.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(79753.2891, grad_fn=<MseLossBackward>)
output :  tensor([[201405.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2233810.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139507.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(257318.4219, grad_fn=<MseLossBackward>)
output :  tensor([[193870.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(396191.5625, grad_fn=<MseLossBackward>)
output :  tensor([[137295.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8778e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181164.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(26957.5352, grad_fn=<MseLossBackward>)
output :  tensor([[240553.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2092769.1250, grad_fn=<MseLossBackward>)
output :  tensor([[176666.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(7107972.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109798.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3234827., grad_fn=<MseLossBackward>)
output :  tensor([[265811.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1564297.3750, grad_fn=<MseLossBackward>)
output :  tensor([[269081.]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6408e+08, grad_fn=<MseLossBackward>)
output :  tensor([[120064.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(8617986., grad_fn=<MseLossBackward>)
output :  tensor([[219226.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1107e+09, grad_fn=<MseLossBackward>)
output :  tensor([[306800.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4222e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208764.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(3113846.2500, grad_fn=<MseLossBackward>)
output :  tensor([[216387.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5280e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158184.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(81135.9609, grad_fn=<MseLossBackward>)
output :  tensor([[168263.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2980262.7500, grad_fn=<MseLossBackward>)
output :  tensor([[162159.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(27325286., grad_fn=<MseLossBackward>)
output :  tensor([[170241.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(58171.4102, grad_fn=<MseLossBackward>)
output :  tensor([[235288.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0700e+09, grad_fn=<MseLossBackward>)
output :  tensor([[223246.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(38558084., grad_fn=<MseLossBackward>)
output :  tensor([[160486.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8187e+08, grad_fn=<MseLossBackward>)
output :  tensor([[121796.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1447321.7500, grad_fn=<MseLossBackward>)
output :  tensor([[178762.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3105139.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180562.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3103e+09, grad_fn=<MseLossBackward>)
output :  tensor([[209546.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4251e+10, grad_fn=<MseLossBackward>)
output :  tensor([[137339.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(8451103., grad_fn=<MseLossBackward>)
output :  tensor([[149298.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6718e+08, grad_fn=<MseLossBackward>)
output :  tensor([[272532.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(19960510., grad_fn=<MseLossBackward>)
output :  tensor([[90675.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(32208640., grad_fn=<MseLossBackward>)
output :  tensor([[236166.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(111514.2500, grad_fn=<MseLossBackward>)
output :  tensor([[262026.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0298e+11, grad_fn=<MseLossBackward>)
output :  tensor([[168953.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1095685.5000, grad_fn=<MseLossBackward>)
output :  tensor([[193857.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6927e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153477.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2319338.7500, grad_fn=<MseLossBackward>)
output :  tensor([[207123.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9534e+09, grad_fn=<MseLossBackward>)
output :  tensor([[128081.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(844230.7500, grad_fn=<MseLossBackward>)
output :  tensor([[148524.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(12418906., grad_fn=<MseLossBackward>)
output :  tensor([[167539.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2699e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184355.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2234744.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128661.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(7082958.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136889.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(151564.2188, grad_fn=<MseLossBackward>)
output :  tensor([[179610.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(43698296., grad_fn=<MseLossBackward>)
output :  tensor([[195860.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9310e+09, grad_fn=<MseLossBackward>)
output :  tensor([[239513.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(12157643., grad_fn=<MseLossBackward>)
output :  tensor([[152533.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6083082.5000, grad_fn=<MseLossBackward>)
output :  tensor([[196223.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(50043.0898, grad_fn=<MseLossBackward>)
output :  tensor([[163636.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8560e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182268.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7667015., grad_fn=<MseLossBackward>)
output :  tensor([[180530.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(397057.5000, grad_fn=<MseLossBackward>)
output :  tensor([[97788.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(621054.8125, grad_fn=<MseLossBackward>)
output :  tensor([[171544.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1763e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134352.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(418669.6562, grad_fn=<MseLossBackward>)
output :  tensor([[123259.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(68222176., grad_fn=<MseLossBackward>)
output :  tensor([[175370.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1878741.3750, grad_fn=<MseLossBackward>)
output :  tensor([[82953.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(4186755.5000, grad_fn=<MseLossBackward>)
output :  tensor([[280204.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(95959168., grad_fn=<MseLossBackward>)
output :  tensor([[167893.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(8373608., grad_fn=<MseLossBackward>)
output :  tensor([[188580.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0905e+10, grad_fn=<MseLossBackward>)
output :  tensor([[249398.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6661e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155625.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(21397708., grad_fn=<MseLossBackward>)
output :  tensor([[122643.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1840473.7500, grad_fn=<MseLossBackward>)
output :  tensor([[119023.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(768992., grad_fn=<MseLossBackward>)
output :  tensor([[141524.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0353e+08, grad_fn=<MseLossBackward>)
output :  tensor([[170753.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(10536617., grad_fn=<MseLossBackward>)
output :  tensor([[111193.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2329e+08, grad_fn=<MseLossBackward>)
output :  tensor([[212479.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1135e+10, grad_fn=<MseLossBackward>)
output :  tensor([[231410.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0180e+08, grad_fn=<MseLossBackward>)
output :  tensor([[254829.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9702e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222751.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6400e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195256.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4459e+10, grad_fn=<MseLossBackward>)
output :  tensor([[186959.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(292511.9688, grad_fn=<MseLossBackward>)
output :  tensor([[207648.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7185e+10, grad_fn=<MseLossBackward>)
output :  tensor([[192089.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0710e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177173.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2452551.7500, grad_fn=<MseLossBackward>)
output :  tensor([[149584.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(5833357., grad_fn=<MseLossBackward>)
output :  tensor([[337492.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(243018.1875, grad_fn=<MseLossBackward>)
output :  tensor([[207309.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(22001962., grad_fn=<MseLossBackward>)
output :  tensor([[157375.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(6888164.5000, grad_fn=<MseLossBackward>)
output :  tensor([[188452.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8140e+09, grad_fn=<MseLossBackward>)
output :  tensor([[102350.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(7020885., grad_fn=<MseLossBackward>)
output :  tensor([[278788.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6293e+10, grad_fn=<MseLossBackward>)
output :  tensor([[173430.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(220151.5781, grad_fn=<MseLossBackward>)
output :  tensor([[216038.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6442158., grad_fn=<MseLossBackward>)
output :  tensor([[215188.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(33776984., grad_fn=<MseLossBackward>)
output :  tensor([[176817.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5676232., grad_fn=<MseLossBackward>)
output :  tensor([[200700.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1209725., grad_fn=<MseLossBackward>)
output :  tensor([[153380.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2621970.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144837.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0104e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117408.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1190587.8750, grad_fn=<MseLossBackward>)
output :  tensor([[141882.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3543512., grad_fn=<MseLossBackward>)
output :  tensor([[150046.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1095620.1250, grad_fn=<MseLossBackward>)
output :  tensor([[202467.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5758e+10, grad_fn=<MseLossBackward>)
output :  tensor([[162216.]], grad_fn=<AddmmBackward>)
loss:  tensor(7376656., grad_fn=<MseLossBackward>)
output :  tensor([[100938.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(2070024., grad_fn=<MseLossBackward>)
output :  tensor([[226235.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8947e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184758.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7089e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176673.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(35461.5977, grad_fn=<MseLossBackward>)
output :  tensor([[80850.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(1320757.6250, grad_fn=<MseLossBackward>)
output :  tensor([[128170.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(108323.2656, grad_fn=<MseLossBackward>)
output :  tensor([[213902.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9597.8760, grad_fn=<MseLossBackward>)
output :  tensor([[143285.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(510063.7812, grad_fn=<MseLossBackward>)
output :  tensor([[129119.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(775032.6250, grad_fn=<MseLossBackward>)
output :  tensor([[145686.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(9526386., grad_fn=<MseLossBackward>)
output :  tensor([[176647.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5325e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144454.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(206385.6562, grad_fn=<MseLossBackward>)
output :  tensor([[161259.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1586379.6250, grad_fn=<MseLossBackward>)
output :  tensor([[215130.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(16932.5156, grad_fn=<MseLossBackward>)
output :  tensor([[135215.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1300e+08, grad_fn=<MseLossBackward>)
output :  tensor([[258294.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(10855583., grad_fn=<MseLossBackward>)
output :  tensor([[161201.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2895740.2500, grad_fn=<MseLossBackward>)
output :  tensor([[130544.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4181769.5000, grad_fn=<MseLossBackward>)
output :  tensor([[94327.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(452645.1250, grad_fn=<MseLossBackward>)
output :  tensor([[154107.]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8451e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179987.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7618.0166, grad_fn=<MseLossBackward>)
output :  tensor([[122498.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3994377., grad_fn=<MseLossBackward>)
output :  tensor([[190836.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4526e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144561.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2329e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149941.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1741.7581, grad_fn=<MseLossBackward>)
output :  tensor([[188236.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(236758.2656, grad_fn=<MseLossBackward>)
output :  tensor([[253034.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6034e+09, grad_fn=<MseLossBackward>)
output :  tensor([[87796.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(13719095., grad_fn=<MseLossBackward>)
output :  tensor([[238874.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1267242.7500, grad_fn=<MseLossBackward>)
output :  tensor([[130119.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(2623159.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164941.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0193e+10, grad_fn=<MseLossBackward>)
output :  tensor([[112885.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6605e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174796.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1447848.1250, grad_fn=<MseLossBackward>)
output :  tensor([[161638.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9455e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153302.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1997e+08, grad_fn=<MseLossBackward>)
output :  tensor([[237459.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2371840.7500, grad_fn=<MseLossBackward>)
output :  tensor([[224510.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1216e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127036.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1324.2776, grad_fn=<MseLossBackward>)
output :  tensor([[126284.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(81082.5625, grad_fn=<MseLossBackward>)
output :  tensor([[225373.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2645909., grad_fn=<MseLossBackward>)
output :  tensor([[231019.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(8880679., grad_fn=<MseLossBackward>)
output :  tensor([[229908.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(10297280., grad_fn=<MseLossBackward>)
output :  tensor([[145296.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7307138., grad_fn=<MseLossBackward>)
output :  tensor([[209578.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(178018.0625, grad_fn=<MseLossBackward>)
output :  tensor([[126881.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(47349020., grad_fn=<MseLossBackward>)
output :  tensor([[135411.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(8475922., grad_fn=<MseLossBackward>)
output :  tensor([[313162.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3375372.7500, grad_fn=<MseLossBackward>)
output :  tensor([[137324.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(13508496., grad_fn=<MseLossBackward>)
output :  tensor([[120903.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9056e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108231.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(1609984.2500, grad_fn=<MseLossBackward>)
output :  tensor([[156996.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4037e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180751.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8310e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176501.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(12261268., grad_fn=<MseLossBackward>)
output :  tensor([[195829.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(26736332., grad_fn=<MseLossBackward>)
output :  tensor([[99000.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(999203.3125, grad_fn=<MseLossBackward>)
output :  tensor([[181547.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(6491428., grad_fn=<MseLossBackward>)
output :  tensor([[168481.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(338142.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142448.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(11893661., grad_fn=<MseLossBackward>)
output :  tensor([[265679.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7273e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141978.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2466e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173663.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(440418.8750, grad_fn=<MseLossBackward>)
output :  tensor([[141241.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1540430., grad_fn=<MseLossBackward>)
output :  tensor([[202509.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4036395., grad_fn=<MseLossBackward>)
output :  tensor([[169156.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(711070.5625, grad_fn=<MseLossBackward>)
output :  tensor([[241472.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6388651., grad_fn=<MseLossBackward>)
output :  tensor([[133343.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1338468.2500, grad_fn=<MseLossBackward>)
output :  tensor([[151171.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3316439.2500, grad_fn=<MseLossBackward>)
output :  tensor([[210078.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(24217778., grad_fn=<MseLossBackward>)
output :  tensor([[170059.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(25594430., grad_fn=<MseLossBackward>)
output :  tensor([[192872.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(14996014., grad_fn=<MseLossBackward>)
output :  tensor([[132032.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2723e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129184.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(34155.6602, grad_fn=<MseLossBackward>)
output :  tensor([[136056.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(15554273., grad_fn=<MseLossBackward>)
output :  tensor([[205028.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1566e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167592.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7659e+09, grad_fn=<MseLossBackward>)
output :  tensor([[72564.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5786e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92881.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(70242208., grad_fn=<MseLossBackward>)
output :  tensor([[253442.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(22415.7031, grad_fn=<MseLossBackward>)
output :  tensor([[201557.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9134e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115748.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(560357.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157919.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7499e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208683.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2806e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179122.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2587e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157064.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4260676.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170693.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(480487.2500, grad_fn=<MseLossBackward>)
output :  tensor([[117968.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8810508., grad_fn=<MseLossBackward>)
output :  tensor([[159512.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(20361952., grad_fn=<MseLossBackward>)
output :  tensor([[194221.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6074e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221070.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2467844.7500, grad_fn=<MseLossBackward>)
output :  tensor([[245856.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4914e+11, grad_fn=<MseLossBackward>)
output :  tensor([[145964.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1071419.1250, grad_fn=<MseLossBackward>)
output :  tensor([[109147.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(445472.8125, grad_fn=<MseLossBackward>)
output :  tensor([[169766.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4723e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148256.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5031960.5000, grad_fn=<MseLossBackward>)
output :  tensor([[235741.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1583940.2500, grad_fn=<MseLossBackward>)
output :  tensor([[115332.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(110431.5938, grad_fn=<MseLossBackward>)
output :  tensor([[182342.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(310754., grad_fn=<MseLossBackward>)
output :  tensor([[186939.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(57292.9102, grad_fn=<MseLossBackward>)
output :  tensor([[164802.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4086e+10, grad_fn=<MseLossBackward>)
output :  tensor([[93555.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5764e+08, grad_fn=<MseLossBackward>)
output :  tensor([[242014.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(9090131., grad_fn=<MseLossBackward>)
output :  tensor([[174748.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1565900.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138758.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1541361., grad_fn=<MseLossBackward>)
output :  tensor([[233717.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1643844.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163284.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(80993.6016, grad_fn=<MseLossBackward>)
output :  tensor([[203723.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4708e+10, grad_fn=<MseLossBackward>)
output :  tensor([[129977.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(25229588., grad_fn=<MseLossBackward>)
output :  tensor([[185946.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7343e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137590.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2530137.5000, grad_fn=<MseLossBackward>)
output :  tensor([[228195.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(60904124., grad_fn=<MseLossBackward>)
output :  tensor([[225448.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0279e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91756.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(3085100.2500, grad_fn=<MseLossBackward>)
output :  tensor([[161116.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2830964., grad_fn=<MseLossBackward>)
output :  tensor([[247578.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5203e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145731.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(535320.8750, grad_fn=<MseLossBackward>)
output :  tensor([[109740.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8267e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161546.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(8721224., grad_fn=<MseLossBackward>)
output :  tensor([[144395.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(156123.7656, grad_fn=<MseLossBackward>)
output :  tensor([[129581.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1908758.1250, grad_fn=<MseLossBackward>)
output :  tensor([[189467.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8347e+09, grad_fn=<MseLossBackward>)
output :  tensor([[122599.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(9862.9727, grad_fn=<MseLossBackward>)
output :  tensor([[154601.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6769022., grad_fn=<MseLossBackward>)
output :  tensor([[168249.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(12256235., grad_fn=<MseLossBackward>)
output :  tensor([[147232.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(14196529., grad_fn=<MseLossBackward>)
output :  tensor([[162754.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(21124.8047, grad_fn=<MseLossBackward>)
output :  tensor([[135940.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2580e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130378.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2629161., grad_fn=<MseLossBackward>)
output :  tensor([[153949.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2350e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146244.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4377052.5000, grad_fn=<MseLossBackward>)
output :  tensor([[164112.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(5579708.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135333.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4687e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148195.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(365817.0625, grad_fn=<MseLossBackward>)
output :  tensor([[183075.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(24250546., grad_fn=<MseLossBackward>)
output :  tensor([[168824.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(30959.5020, grad_fn=<MseLossBackward>)
output :  tensor([[179755.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(59810.8164, grad_fn=<MseLossBackward>)
output :  tensor([[221191.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1420081.8750, grad_fn=<MseLossBackward>)
output :  tensor([[112091.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(17570702., grad_fn=<MseLossBackward>)
output :  tensor([[137101.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4887e+08, grad_fn=<MseLossBackward>)
output :  tensor([[283462.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6439699., grad_fn=<MseLossBackward>)
output :  tensor([[118050.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4203589., grad_fn=<MseLossBackward>)
output :  tensor([[177788.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7818e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183471.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2337554.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188757.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(10609983., grad_fn=<MseLossBackward>)
output :  tensor([[248789.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8700e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222796.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(635134.3125, grad_fn=<MseLossBackward>)
output :  tensor([[118944.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7016e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172697.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8801e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125694.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2871701., grad_fn=<MseLossBackward>)
output :  tensor([[183137.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5353e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153123.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(15140.5332, grad_fn=<MseLossBackward>)
output :  tensor([[153325.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(46584464., grad_fn=<MseLossBackward>)
output :  tensor([[204021.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5193556., grad_fn=<MseLossBackward>)
output :  tensor([[144389.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4136e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174596.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1970207., grad_fn=<MseLossBackward>)
output :  tensor([[252845.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1048e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150073.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4300698.5000, grad_fn=<MseLossBackward>)
output :  tensor([[199981.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7199243.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159959.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(83.8369, grad_fn=<MseLossBackward>)
output :  tensor([[120876.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0808e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133180.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6603856., grad_fn=<MseLossBackward>)
output :  tensor([[180580.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(11692873., grad_fn=<MseLossBackward>)
output :  tensor([[200360.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0735e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238719.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5281e+09, grad_fn=<MseLossBackward>)
output :  tensor([[252494.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(20297560., grad_fn=<MseLossBackward>)
output :  tensor([[188893.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6928e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141539.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5039e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145364.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(747225.1875, grad_fn=<MseLossBackward>)
output :  tensor([[70121.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0732e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133350.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2719355.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126120.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(7725707., grad_fn=<MseLossBackward>)
output :  tensor([[155785.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(3188066., grad_fn=<MseLossBackward>)
output :  tensor([[132151.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(26541012., grad_fn=<MseLossBackward>)
output :  tensor([[74511.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(3955592.7500, grad_fn=<MseLossBackward>)
output :  tensor([[82704.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(495836.0312, grad_fn=<MseLossBackward>)
output :  tensor([[239462.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(55682144., grad_fn=<MseLossBackward>)
output :  tensor([[140766.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9899e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126921.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(12803314., grad_fn=<MseLossBackward>)
output :  tensor([[167643.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(414293.3750, grad_fn=<MseLossBackward>)
output :  tensor([[235567.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(322517.5000, grad_fn=<MseLossBackward>)
output :  tensor([[190608.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2344056.7500, grad_fn=<MseLossBackward>)
output :  tensor([[154782.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1481469.3750, grad_fn=<MseLossBackward>)
output :  tensor([[199679.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3165675., grad_fn=<MseLossBackward>)
output :  tensor([[205659.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(9.8223e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135428.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2468286.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155333.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(110909.8125, grad_fn=<MseLossBackward>)
output :  tensor([[136782.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(612844.3125, grad_fn=<MseLossBackward>)
output :  tensor([[200219.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8688e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149655.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(18877260., grad_fn=<MseLossBackward>)
output :  tensor([[134168.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6539e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143180.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2956035.5000, grad_fn=<MseLossBackward>)
output :  tensor([[207990.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(16079849., grad_fn=<MseLossBackward>)
output :  tensor([[98613.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7600e+08, grad_fn=<MseLossBackward>)
output :  tensor([[166726.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(597818.9375, grad_fn=<MseLossBackward>)
output :  tensor([[129241.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1540934.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143421.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(12807340., grad_fn=<MseLossBackward>)
output :  tensor([[101366.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5197e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137637.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(18859.0137, grad_fn=<MseLossBackward>)
output :  tensor([[233650.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(5521619., grad_fn=<MseLossBackward>)
output :  tensor([[143270.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2992197.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139629.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4534570.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162588.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1964e+09, grad_fn=<MseLossBackward>)
output :  tensor([[272468.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(30594380., grad_fn=<MseLossBackward>)
output :  tensor([[171006.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(15944548., grad_fn=<MseLossBackward>)
output :  tensor([[103827.]], grad_fn=<AddmmBackward>)
loss:  tensor(1104601., grad_fn=<MseLossBackward>)
output :  tensor([[201985.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7025e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161987.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(8926743., grad_fn=<MseLossBackward>)
output :  tensor([[164014.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5544e+10, grad_fn=<MseLossBackward>)
output :  tensor([[100045.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(3047343., grad_fn=<MseLossBackward>)
output :  tensor([[123979.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(144281.2812, grad_fn=<MseLossBackward>)
output :  tensor([[155831.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(28476.5625, grad_fn=<MseLossBackward>)
output :  tensor([[141337.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1789616.8750, grad_fn=<MseLossBackward>)
output :  tensor([[199352.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(419762.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139047.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8718917., grad_fn=<MseLossBackward>)
output :  tensor([[263046.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(586803.8750, grad_fn=<MseLossBackward>)
output :  tensor([[125369.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0478e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164716.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(614558., grad_fn=<MseLossBackward>)
output :  tensor([[190193.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2866884., grad_fn=<MseLossBackward>)
output :  tensor([[121965.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4317e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244368.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(31712736., grad_fn=<MseLossBackward>)
output :  tensor([[159385.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6254e+08, grad_fn=<MseLossBackward>)
output :  tensor([[247307.]], grad_fn=<AddmmBackward>)
loss:  tensor(3829849., grad_fn=<MseLossBackward>)
output :  tensor([[149192.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(26964978., grad_fn=<MseLossBackward>)
output :  tensor([[209543.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(208292.4062, grad_fn=<MseLossBackward>)
output :  tensor([[171730.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(448000.1250, grad_fn=<MseLossBackward>)
output :  tensor([[155686.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2842648.7500, grad_fn=<MseLossBackward>)
output :  tensor([[118111.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(12338.3496, grad_fn=<MseLossBackward>)
output :  tensor([[241693.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0608e+09, grad_fn=<MseLossBackward>)
output :  tensor([[235837.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(17326276., grad_fn=<MseLossBackward>)
output :  tensor([[151717.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2623843.2500, grad_fn=<MseLossBackward>)
output :  tensor([[253079.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3314675.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125387.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1844e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174747.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1569891.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162558.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6548161., grad_fn=<MseLossBackward>)
output :  tensor([[131276.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(76219.1328, grad_fn=<MseLossBackward>)
output :  tensor([[190651.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7395e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166359.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5568862.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163702.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(493703.8438, grad_fn=<MseLossBackward>)
output :  tensor([[157731.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(72100.6406, grad_fn=<MseLossBackward>)
output :  tensor([[148752.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1317868.1250, grad_fn=<MseLossBackward>)
output :  tensor([[171090.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7934e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160671.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(450765.3750, grad_fn=<MseLossBackward>)
output :  tensor([[380753.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(10347280., grad_fn=<MseLossBackward>)
output :  tensor([[114820.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4834e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132067.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1685e+09, grad_fn=<MseLossBackward>)
output :  tensor([[278845.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5604168.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161104.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(802452.0625, grad_fn=<MseLossBackward>)
output :  tensor([[130908.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0835e+08, grad_fn=<MseLossBackward>)
output :  tensor([[218157.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9160e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183032.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6414822.5000, grad_fn=<MseLossBackward>)
output :  tensor([[153553.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2412974., grad_fn=<MseLossBackward>)
output :  tensor([[145958.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(918392.8125, grad_fn=<MseLossBackward>)
output :  tensor([[153137.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6365e+08, grad_fn=<MseLossBackward>)
output :  tensor([[101982.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3931669.2500, grad_fn=<MseLossBackward>)
output :  tensor([[72836.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6477e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163519.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2191880.2500, grad_fn=<MseLossBackward>)
output :  tensor([[191794.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3109e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164712.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(45062272., grad_fn=<MseLossBackward>)
output :  tensor([[163221.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(32741106., grad_fn=<MseLossBackward>)
output :  tensor([[138192.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(551631.1250, grad_fn=<MseLossBackward>)
output :  tensor([[205458.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(241526.1719, grad_fn=<MseLossBackward>)
output :  tensor([[139952.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3810731., grad_fn=<MseLossBackward>)
output :  tensor([[182073.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6365e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145084.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(837282.1875, grad_fn=<MseLossBackward>)
output :  tensor([[107942.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2214e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92970.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1060192., grad_fn=<MseLossBackward>)
output :  tensor([[174691.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(95172.2500, grad_fn=<MseLossBackward>)
output :  tensor([[261396.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(993759.7500, grad_fn=<MseLossBackward>)
output :  tensor([[139834.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2774202.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158482.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1995862.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134761.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5113534., grad_fn=<MseLossBackward>)
output :  tensor([[148544.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(912651.8125, grad_fn=<MseLossBackward>)
output :  tensor([[166122.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3161006.2500, grad_fn=<MseLossBackward>)
output :  tensor([[126885.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(13190.8818, grad_fn=<MseLossBackward>)
output :  tensor([[169255.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8832e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160958.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(15668609., grad_fn=<MseLossBackward>)
output :  tensor([[117660.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1347775.8750, grad_fn=<MseLossBackward>)
output :  tensor([[160450.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2634e+09, grad_fn=<MseLossBackward>)
output :  tensor([[53864.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3475777.5000, grad_fn=<MseLossBackward>)
output :  tensor([[233246.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2812e+09, grad_fn=<MseLossBackward>)
output :  tensor([[202228.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1509404.2500, grad_fn=<MseLossBackward>)
output :  tensor([[186672.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2795845.2500, grad_fn=<MseLossBackward>)
output :  tensor([[106752.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(565621.5000, grad_fn=<MseLossBackward>)
output :  tensor([[89118.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(4489730.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129233.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1591e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222246.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1485e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205688.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3282155., grad_fn=<MseLossBackward>)
output :  tensor([[170425.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(29434694., grad_fn=<MseLossBackward>)
output :  tensor([[174584.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1750e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189538.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(212895.7344, grad_fn=<MseLossBackward>)
output :  tensor([[87197.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(39163.7930, grad_fn=<MseLossBackward>)
output :  tensor([[136938.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(9371921., grad_fn=<MseLossBackward>)
output :  tensor([[113177.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(7168755., grad_fn=<MseLossBackward>)
output :  tensor([[149941.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9548e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174335.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8780e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194734.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0538e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180485.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(235528.2188, grad_fn=<MseLossBackward>)
output :  tensor([[97621.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(1258831.3750, grad_fn=<MseLossBackward>)
output :  tensor([[116241.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1582682., grad_fn=<MseLossBackward>)
output :  tensor([[161569.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0314e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198804.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1429556.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145718.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2954585., grad_fn=<MseLossBackward>)
train_loss: [2.555683e+09]
epoch_result tensor([0.])
output :  tensor([[159651.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1327068., grad_fn=<MseLossBackward>)
output :  tensor([[119627.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(5628941.5000, grad_fn=<MseLossBackward>)
output :  tensor([[195912.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2930355.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175750.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1562382.8750, grad_fn=<MseLossBackward>)
output :  tensor([[149224.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2804e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124978.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(9129462., grad_fn=<MseLossBackward>)
output :  tensor([[141523.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(273888.6875, grad_fn=<MseLossBackward>)
output :  tensor([[119708.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(501773., grad_fn=<MseLossBackward>)
output :  tensor([[62402.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(15225909., grad_fn=<MseLossBackward>)
output :  tensor([[165856.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(20569.8340, grad_fn=<MseLossBackward>)
output :  tensor([[139822.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(31351.1289, grad_fn=<MseLossBackward>)
output :  tensor([[223627.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1883884.8750, grad_fn=<MseLossBackward>)
output :  tensor([[168339.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(436611.2188, grad_fn=<MseLossBackward>)
output :  tensor([[250438.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(544851.5625, grad_fn=<MseLossBackward>)
output :  tensor([[53034.9492]], grad_fn=<AddmmBackward>)
loss:  tensor(3861424.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159793.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3390e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176564.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2447513.5000, grad_fn=<MseLossBackward>)
output :  tensor([[152978.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(12401843., grad_fn=<MseLossBackward>)
output :  tensor([[274731.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(72226.5625, grad_fn=<MseLossBackward>)
output :  tensor([[195690.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1713849.1250, grad_fn=<MseLossBackward>)
output :  tensor([[138027.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5335e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195326.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2094125.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180223.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9959e+09, grad_fn=<MseLossBackward>)
output :  tensor([[150111.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(788710.5000, grad_fn=<MseLossBackward>)
output :  tensor([[171946.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3789835.5000, grad_fn=<MseLossBackward>)
output :  tensor([[84621.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(606621.9375, grad_fn=<MseLossBackward>)
output :  tensor([[170080.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2582e+09, grad_fn=<MseLossBackward>)
output :  tensor([[187162.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4676879.5000, grad_fn=<MseLossBackward>)
output :  tensor([[211288.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9547e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111792.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3212608.2500, grad_fn=<MseLossBackward>)
output :  tensor([[170573.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(182075.5625, grad_fn=<MseLossBackward>)
output :  tensor([[135884.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(378628.6875, grad_fn=<MseLossBackward>)
output :  tensor([[130738.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3023523.2500, grad_fn=<MseLossBackward>)
output :  tensor([[121678.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4744228.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147077.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0468e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165656.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2304e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150328.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(394599.9062, grad_fn=<MseLossBackward>)
output :  tensor([[180399.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(159475.4375, grad_fn=<MseLossBackward>)
output :  tensor([[141951.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(904638.7500, grad_fn=<MseLossBackward>)
output :  tensor([[105235.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3211e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135843.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2657e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133095.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3627894., grad_fn=<MseLossBackward>)
output :  tensor([[131878.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(23795798., grad_fn=<MseLossBackward>)
output :  tensor([[223102.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3600209.7500, grad_fn=<MseLossBackward>)
output :  tensor([[132125.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(15476.9150, grad_fn=<MseLossBackward>)
output :  tensor([[145423.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(12789341., grad_fn=<MseLossBackward>)
output :  tensor([[110333.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(2777717., grad_fn=<MseLossBackward>)
output :  tensor([[161930.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3728580., grad_fn=<MseLossBackward>)
output :  tensor([[145522.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4481e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193792.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3214008.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135350.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(811040.9375, grad_fn=<MseLossBackward>)
output :  tensor([[124346.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0581e+08, grad_fn=<MseLossBackward>)
output :  tensor([[234762.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(581477.7500, grad_fn=<MseLossBackward>)
output :  tensor([[167368.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1272e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157286.]], grad_fn=<AddmmBackward>)
loss:  tensor(2937796., grad_fn=<MseLossBackward>)
output :  tensor([[205260.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7969e+10, grad_fn=<MseLossBackward>)
output :  tensor([[248372.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1157e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144668.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1365903.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132401.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2556401.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155138.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(19195.2363, grad_fn=<MseLossBackward>)
output :  tensor([[135765.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(33239548., grad_fn=<MseLossBackward>)
output :  tensor([[179512.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4782e+09, grad_fn=<MseLossBackward>)
output :  tensor([[183471.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(395189.0312, grad_fn=<MseLossBackward>)
output :  tensor([[167032.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(30610630., grad_fn=<MseLossBackward>)
output :  tensor([[143303.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(92017.4297, grad_fn=<MseLossBackward>)
output :  tensor([[143516.]], grad_fn=<AddmmBackward>)
loss:  tensor(1032256., grad_fn=<MseLossBackward>)
output :  tensor([[141178.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(14603026., grad_fn=<MseLossBackward>)
output :  tensor([[173304.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4065e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196147.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3483e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137164.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(441601.7812, grad_fn=<MseLossBackward>)
output :  tensor([[173002.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1216574.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176111.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(23893002., grad_fn=<MseLossBackward>)
output :  tensor([[118011.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(9069273., grad_fn=<MseLossBackward>)
output :  tensor([[218493.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6283325.5000, grad_fn=<MseLossBackward>)
output :  tensor([[186752.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(10578553., grad_fn=<MseLossBackward>)
output :  tensor([[125646.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(21459.9609, grad_fn=<MseLossBackward>)
output :  tensor([[198333.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3362467.2500, grad_fn=<MseLossBackward>)
output :  tensor([[176678.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3164007.2500, grad_fn=<MseLossBackward>)
output :  tensor([[209215.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1341e+10, grad_fn=<MseLossBackward>)
output :  tensor([[208525.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6123382., grad_fn=<MseLossBackward>)
output :  tensor([[163065.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0282e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192062.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5943387., grad_fn=<MseLossBackward>)
output :  tensor([[113015.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(247.8165, grad_fn=<MseLossBackward>)
output :  tensor([[113875.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1892946., grad_fn=<MseLossBackward>)
output :  tensor([[112776.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(603158.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147471.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(451080.1250, grad_fn=<MseLossBackward>)
output :  tensor([[161693.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2743e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180868.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(754835.1875, grad_fn=<MseLossBackward>)
output :  tensor([[128840.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(1796919.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145635.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(403483., grad_fn=<MseLossBackward>)
output :  tensor([[185968.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6080e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120163.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(10651911., grad_fn=<MseLossBackward>)
output :  tensor([[197208.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(43641.8203, grad_fn=<MseLossBackward>)
output :  tensor([[144652.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(120680.2500, grad_fn=<MseLossBackward>)
output :  tensor([[208703.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(17611924., grad_fn=<MseLossBackward>)
output :  tensor([[125554.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(198623.4219, grad_fn=<MseLossBackward>)
output :  tensor([[246371.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3827097.5000, grad_fn=<MseLossBackward>)
output :  tensor([[237881.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2201e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145399.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9599e+08, grad_fn=<MseLossBackward>)
output :  tensor([[85191.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8522e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197111.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0510e+09, grad_fn=<MseLossBackward>)
output :  tensor([[83601.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(6765892., grad_fn=<MseLossBackward>)
output :  tensor([[136448.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(9312034., grad_fn=<MseLossBackward>)
output :  tensor([[77650.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4623104.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143039.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(7457.9414, grad_fn=<MseLossBackward>)
output :  tensor([[176826.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(683412.2500, grad_fn=<MseLossBackward>)
output :  tensor([[153195.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(92767.8359, grad_fn=<MseLossBackward>)
output :  tensor([[107219.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(32447.8301, grad_fn=<MseLossBackward>)
output :  tensor([[206480.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1940e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132161.]], grad_fn=<AddmmBackward>)
loss:  tensor(13402921., grad_fn=<MseLossBackward>)
output :  tensor([[267916.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4600e+08, grad_fn=<MseLossBackward>)
output :  tensor([[307543.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6033010.5000, grad_fn=<MseLossBackward>)
output :  tensor([[107726.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(51454.5430, grad_fn=<MseLossBackward>)
output :  tensor([[169738.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7623552.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135230.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4151e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130628.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(70074816., grad_fn=<MseLossBackward>)
output :  tensor([[124436.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(33798872., grad_fn=<MseLossBackward>)
output :  tensor([[128433.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(11787581., grad_fn=<MseLossBackward>)
output :  tensor([[134199.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1009e+08, grad_fn=<MseLossBackward>)
output :  tensor([[228183.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7954e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191376.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2387e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144183.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(80310.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129908.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(5802791.5000, grad_fn=<MseLossBackward>)
output :  tensor([[111615.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(133675.9219, grad_fn=<MseLossBackward>)
output :  tensor([[257386.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6814e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136708.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2919185.7500, grad_fn=<MseLossBackward>)
output :  tensor([[204066.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1137055.6250, grad_fn=<MseLossBackward>)
output :  tensor([[98262.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(44055992., grad_fn=<MseLossBackward>)
output :  tensor([[140566.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(380149.3125, grad_fn=<MseLossBackward>)
output :  tensor([[213800.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1448e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181141.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1540468.8750, grad_fn=<MseLossBackward>)
output :  tensor([[188379.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(11420915., grad_fn=<MseLossBackward>)
output :  tensor([[164059.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1008e+10, grad_fn=<MseLossBackward>)
output :  tensor([[300483.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1914e+09, grad_fn=<MseLossBackward>)
output :  tensor([[198844.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(892404.9375, grad_fn=<MseLossBackward>)
output :  tensor([[260135.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0371e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222529.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8897e+09, grad_fn=<MseLossBackward>)
output :  tensor([[286999.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0000e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221500.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(6247812.5000, grad_fn=<MseLossBackward>)
output :  tensor([[223656.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8339e+10, grad_fn=<MseLossBackward>)
output :  tensor([[197608.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(370804.8750, grad_fn=<MseLossBackward>)
output :  tensor([[158668.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8025e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135485.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8913583., grad_fn=<MseLossBackward>)
output :  tensor([[134683.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(666264.0625, grad_fn=<MseLossBackward>)
output :  tensor([[89311.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(2850847.5000, grad_fn=<MseLossBackward>)
output :  tensor([[105569.6328]], grad_fn=<AddmmBackward>)
loss:  tensor(5906684.5000, grad_fn=<MseLossBackward>)
output :  tensor([[274435.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9664e+09, grad_fn=<MseLossBackward>)
output :  tensor([[235994.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(988191.3125, grad_fn=<MseLossBackward>)
output :  tensor([[145261.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(68496.7031, grad_fn=<MseLossBackward>)
output :  tensor([[132759.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(22468636., grad_fn=<MseLossBackward>)
output :  tensor([[172764.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(937598.8125, grad_fn=<MseLossBackward>)
output :  tensor([[149305.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(16447587., grad_fn=<MseLossBackward>)
output :  tensor([[166134.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0459e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164954.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2044.7354, grad_fn=<MseLossBackward>)
output :  tensor([[140079.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(9482454., grad_fn=<MseLossBackward>)
output :  tensor([[188785.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3937e+09, grad_fn=<MseLossBackward>)
output :  tensor([[112907.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(824237., grad_fn=<MseLossBackward>)
output :  tensor([[174871.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(8247576.5000, grad_fn=<MseLossBackward>)
output :  tensor([[119071.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(861633.5625, grad_fn=<MseLossBackward>)
output :  tensor([[86087.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(833397.8125, grad_fn=<MseLossBackward>)
output :  tensor([[180337.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(113821.8906, grad_fn=<MseLossBackward>)
output :  tensor([[111291.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(1937468.2500, grad_fn=<MseLossBackward>)
output :  tensor([[243272.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(18252120., grad_fn=<MseLossBackward>)
output :  tensor([[248056.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(9344198., grad_fn=<MseLossBackward>)
output :  tensor([[129137.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(131145.8281, grad_fn=<MseLossBackward>)
output :  tensor([[114618.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(32033036., grad_fn=<MseLossBackward>)
output :  tensor([[288047.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2233e+10, grad_fn=<MseLossBackward>)
output :  tensor([[173631.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4541494., grad_fn=<MseLossBackward>)
output :  tensor([[123188.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3280060.5000, grad_fn=<MseLossBackward>)
output :  tensor([[142470.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9881e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202317.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3648e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141069.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4854.1699, grad_fn=<MseLossBackward>)
output :  tensor([[159360.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4554e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152486.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1997584.7500, grad_fn=<MseLossBackward>)
output :  tensor([[129149.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(123151.6484, grad_fn=<MseLossBackward>)
output :  tensor([[249789.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6566e+10, grad_fn=<MseLossBackward>)
output :  tensor([[398387.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(13048124., grad_fn=<MseLossBackward>)
output :  tensor([[109732.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(536350.2500, grad_fn=<MseLossBackward>)
output :  tensor([[122849.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(18919578., grad_fn=<MseLossBackward>)
output :  tensor([[159408.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(8372.2500, grad_fn=<MseLossBackward>)
output :  tensor([[127832.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8475e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162353.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5577e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172290.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8801e+09, grad_fn=<MseLossBackward>)
output :  tensor([[104550.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(904386.1250, grad_fn=<MseLossBackward>)
output :  tensor([[139430.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2463477.5000, grad_fn=<MseLossBackward>)
output :  tensor([[360885.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(41064068., grad_fn=<MseLossBackward>)
output :  tensor([[207015.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2076e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174180.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1742028.7500, grad_fn=<MseLossBackward>)
output :  tensor([[208766.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(34413256., grad_fn=<MseLossBackward>)
output :  tensor([[141832.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(8023233.5000, grad_fn=<MseLossBackward>)
output :  tensor([[193723.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(603704.7500, grad_fn=<MseLossBackward>)
output :  tensor([[132831.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4169e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177774.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(10402238., grad_fn=<MseLossBackward>)
output :  tensor([[239047.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8716703., grad_fn=<MseLossBackward>)
output :  tensor([[174389.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(151515.5625, grad_fn=<MseLossBackward>)
output :  tensor([[109960.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3842641.2500, grad_fn=<MseLossBackward>)
output :  tensor([[262848.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2931479., grad_fn=<MseLossBackward>)
output :  tensor([[251326.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1759685.1250, grad_fn=<MseLossBackward>)
output :  tensor([[124732.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3000798.2500, grad_fn=<MseLossBackward>)
output :  tensor([[214817.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6219e+09, grad_fn=<MseLossBackward>)
output :  tensor([[308080.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9651e+08, grad_fn=<MseLossBackward>)
output :  tensor([[208500.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2250047., grad_fn=<MseLossBackward>)
output :  tensor([[218564.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4747e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159610.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2926612., grad_fn=<MseLossBackward>)
output :  tensor([[169588.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(161164.6094, grad_fn=<MseLossBackward>)
output :  tensor([[162116.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(26880498., grad_fn=<MseLossBackward>)
output :  tensor([[163107.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(47506772., grad_fn=<MseLossBackward>)
output :  tensor([[239374.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1942e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226564.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(8358965., grad_fn=<MseLossBackward>)
output :  tensor([[161298.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0446e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124020.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(1042265.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175863.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1291880.8750, grad_fn=<MseLossBackward>)
output :  tensor([[181869.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1044e+09, grad_fn=<MseLossBackward>)
output :  tensor([[210507.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3896e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132542.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3570800.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147111.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5083e+08, grad_fn=<MseLossBackward>)
output :  tensor([[274376.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(6884556., grad_fn=<MseLossBackward>)
output :  tensor([[86924.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(3702166.7500, grad_fn=<MseLossBackward>)
output :  tensor([[234558.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3771000., grad_fn=<MseLossBackward>)
output :  tensor([[260914.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0370e+11, grad_fn=<MseLossBackward>)
output :  tensor([[169315.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(468518.8750, grad_fn=<MseLossBackward>)
output :  tensor([[196799.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4593e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154270.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(532284.2500, grad_fn=<MseLossBackward>)
output :  tensor([[206875.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9847e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130769.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3131019.7500, grad_fn=<MseLossBackward>)
output :  tensor([[148078.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9474661., grad_fn=<MseLossBackward>)
output :  tensor([[169809.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4580e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182969.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(8299891., grad_fn=<MseLossBackward>)
output :  tensor([[127297.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1683263., grad_fn=<MseLossBackward>)
output :  tensor([[138580.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4329000.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175566.]], grad_fn=<AddmmBackward>)
loss:  tensor(6584356., grad_fn=<MseLossBackward>)
output :  tensor([[199524.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5477e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236016.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(48773200., grad_fn=<MseLossBackward>)
output :  tensor([[152210.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(7782705., grad_fn=<MseLossBackward>)
output :  tensor([[194740.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1587245.6250, grad_fn=<MseLossBackward>)
output :  tensor([[160636.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7679e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184116.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(21308610., grad_fn=<MseLossBackward>)
output :  tensor([[179615.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(80913.5781, grad_fn=<MseLossBackward>)
output :  tensor([[96311.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(474086.0312, grad_fn=<MseLossBackward>)
output :  tensor([[173000.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1449e+10, grad_fn=<MseLossBackward>)
output :  tensor([[137089.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4364378., grad_fn=<MseLossBackward>)
output :  tensor([[121091.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(37105992., grad_fn=<MseLossBackward>)
output :  tensor([[174225.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(50913.6914, grad_fn=<MseLossBackward>)
output :  tensor([[88796.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(14410328., grad_fn=<MseLossBackward>)
output :  tensor([[282987.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(49169460., grad_fn=<MseLossBackward>)
output :  tensor([[169161.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(17315352., grad_fn=<MseLossBackward>)
output :  tensor([[192791.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9706e+10, grad_fn=<MseLossBackward>)
output :  tensor([[250353.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2629e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153299.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5289856.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122602.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1953006.2500, grad_fn=<MseLossBackward>)
output :  tensor([[125305.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(29224498., grad_fn=<MseLossBackward>)
output :  tensor([[145947.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5776e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173491.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(258906.0625, grad_fn=<MseLossBackward>)
output :  tensor([[113261.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4629e+08, grad_fn=<MseLossBackward>)
output :  tensor([[216693.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0263e+10, grad_fn=<MseLossBackward>)
output :  tensor([[238840.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7074020.5000, grad_fn=<MseLossBackward>)
output :  tensor([[254465.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9804e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222818.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6184e+08, grad_fn=<MseLossBackward>)
output :  tensor([[195931.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4297e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189133.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2668016., grad_fn=<MseLossBackward>)
output :  tensor([[208011.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7028e+10, grad_fn=<MseLossBackward>)
output :  tensor([[192887.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0481e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179140.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(160625.6094, grad_fn=<MseLossBackward>)
output :  tensor([[152396.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(157150.2969, grad_fn=<MseLossBackward>)
output :  tensor([[335354.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2708904.5000, grad_fn=<MseLossBackward>)
output :  tensor([[212639.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(409180.0938, grad_fn=<MseLossBackward>)
output :  tensor([[160904.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(817752.8125, grad_fn=<MseLossBackward>)
output :  tensor([[186926.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9783e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110304.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(28137554., grad_fn=<MseLossBackward>)
output :  tensor([[277330.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7100e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174716.]], grad_fn=<AddmmBackward>)
loss:  tensor(665856., grad_fn=<MseLossBackward>)
output :  tensor([[207689.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(33759732., grad_fn=<MseLossBackward>)
output :  tensor([[216354.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(21577042., grad_fn=<MseLossBackward>)
output :  tensor([[176720.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(6148695., grad_fn=<MseLossBackward>)
output :  tensor([[202670.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(756927.1875, grad_fn=<MseLossBackward>)
output :  tensor([[158711.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(13774420., grad_fn=<MseLossBackward>)
output :  tensor([[145106.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0346e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120897.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5749804.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138983.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1033049.8750, grad_fn=<MseLossBackward>)
output :  tensor([[149800.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(641000.3750, grad_fn=<MseLossBackward>)
output :  tensor([[200637.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6221e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161336.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3371068.2500, grad_fn=<MseLossBackward>)
output :  tensor([[101815.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5361323., grad_fn=<MseLossBackward>)
output :  tensor([[226112.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9286e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184364.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5586e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175690.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(630733.8125, grad_fn=<MseLossBackward>)
output :  tensor([[83369.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(1876193.6250, grad_fn=<MseLossBackward>)
output :  tensor([[130766.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5135181., grad_fn=<MseLossBackward>)
output :  tensor([[217587.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(12867914., grad_fn=<MseLossBackward>)
output :  tensor([[143538.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(213054.3594, grad_fn=<MseLossBackward>)
output :  tensor([[133825.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(14632298., grad_fn=<MseLossBackward>)
output :  tensor([[142528.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5105.5488, grad_fn=<MseLossBackward>)
output :  tensor([[174357.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3585e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145188.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1412532.2500, grad_fn=<MseLossBackward>)
output :  tensor([[159590.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(167818.2500, grad_fn=<MseLossBackward>)
output :  tensor([[212973.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4107335.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133594.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1762e+08, grad_fn=<MseLossBackward>)
output :  tensor([[255320.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(102630.1328, grad_fn=<MseLossBackward>)
output :  tensor([[159257.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(58919.9766, grad_fn=<MseLossBackward>)
output :  tensor([[129721.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1490879.1250, grad_fn=<MseLossBackward>)
output :  tensor([[95266.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(71068.0625, grad_fn=<MseLossBackward>)
output :  tensor([[151791.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5281e+09, grad_fn=<MseLossBackward>)
output :  tensor([[179346.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(305860.8438, grad_fn=<MseLossBackward>)
output :  tensor([[119382.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1248142.8750, grad_fn=<MseLossBackward>)
output :  tensor([[190207.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5010e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145732.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3867e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148388.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2284112.7500, grad_fn=<MseLossBackward>)
output :  tensor([[188296.]], grad_fn=<AddmmBackward>)
loss:  tensor(298116., grad_fn=<MseLossBackward>)
output :  tensor([[253092.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5987e+09, grad_fn=<MseLossBackward>)
output :  tensor([[93777.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(5187397.5000, grad_fn=<MseLossBackward>)
output :  tensor([[238108.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3577535.7500, grad_fn=<MseLossBackward>)
output :  tensor([[124626.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(15007331., grad_fn=<MseLossBackward>)
output :  tensor([[166326.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9148e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114138.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9989e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179598.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(12949877., grad_fn=<MseLossBackward>)
output :  tensor([[162951.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5469e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154440.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7313e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236846.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4636956.5000, grad_fn=<MseLossBackward>)
output :  tensor([[221997.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2961e+09, grad_fn=<MseLossBackward>)
output :  tensor([[126552.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(200389.1250, grad_fn=<MseLossBackward>)
output :  tensor([[127617.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(2617191., grad_fn=<MseLossBackward>)
output :  tensor([[225013.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3946492.7500, grad_fn=<MseLossBackward>)
output :  tensor([[226768.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(52300244., grad_fn=<MseLossBackward>)
output :  tensor([[232798.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(37186936., grad_fn=<MseLossBackward>)
output :  tensor([[147872.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(16372.0020, grad_fn=<MseLossBackward>)
output :  tensor([[215137.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(26397920., grad_fn=<MseLossBackward>)
output :  tensor([[132688.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6100e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137740.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(27463660., grad_fn=<MseLossBackward>)
output :  tensor([[311711.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(10813821., grad_fn=<MseLossBackward>)
output :  tensor([[137044.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(15643385., grad_fn=<MseLossBackward>)
output :  tensor([[122024.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0276e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108899.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(360187.5312, grad_fn=<MseLossBackward>)
output :  tensor([[157182.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3464e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181507.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.6895e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174319.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1742193.7500, grad_fn=<MseLossBackward>)
output :  tensor([[195361.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(31796382., grad_fn=<MseLossBackward>)
output :  tensor([[103403.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(11586737., grad_fn=<MseLossBackward>)
output :  tensor([[179428.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(183906.9688, grad_fn=<MseLossBackward>)
output :  tensor([[166537.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1855682.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138955.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1944.2588, grad_fn=<MseLossBackward>)
output :  tensor([[262448.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3415e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142157.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2670e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173724.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(524470.1875, grad_fn=<MseLossBackward>)
output :  tensor([[139859.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(19613.1270, grad_fn=<MseLossBackward>)
output :  tensor([[197581.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(8516639., grad_fn=<MseLossBackward>)
output :  tensor([[169523.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(226992.6875, grad_fn=<MseLossBackward>)
output :  tensor([[244099.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(9872.2852, grad_fn=<MseLossBackward>)
output :  tensor([[133457.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1087686., grad_fn=<MseLossBackward>)
output :  tensor([[150699.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1820349.1250, grad_fn=<MseLossBackward>)
output :  tensor([[212628.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5623790., grad_fn=<MseLossBackward>)
output :  tensor([[164510.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(239319.7031, grad_fn=<MseLossBackward>)
output :  tensor([[186565.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(5927399., grad_fn=<MseLossBackward>)
output :  tensor([[134590.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9583e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128163.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(700464.3750, grad_fn=<MseLossBackward>)
output :  tensor([[139333.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(444763.9375, grad_fn=<MseLossBackward>)
output :  tensor([[204260.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2562e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165202.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5203e+09, grad_fn=<MseLossBackward>)
output :  tensor([[71560.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3365e+08, grad_fn=<MseLossBackward>)
output :  tensor([[94767.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0542e+08, grad_fn=<MseLossBackward>)
output :  tensor([[248828.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(19934412., grad_fn=<MseLossBackward>)
output :  tensor([[204767.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3254e+09, grad_fn=<MseLossBackward>)
output :  tensor([[112369.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(6920886.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161202.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9157e+08, grad_fn=<MseLossBackward>)
output :  tensor([[207569.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5452e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183181.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5375e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159052.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(16424276., grad_fn=<MseLossBackward>)
output :  tensor([[169148.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(725424.8125, grad_fn=<MseLossBackward>)
output :  tensor([[114337.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(439310.0625, grad_fn=<MseLossBackward>)
output :  tensor([[160748.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(33045612., grad_fn=<MseLossBackward>)
output :  tensor([[193171.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8846e+08, grad_fn=<MseLossBackward>)
output :  tensor([[215004.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(20213454., grad_fn=<MseLossBackward>)
output :  tensor([[246440.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4856e+11, grad_fn=<MseLossBackward>)
output :  tensor([[148511.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2285860.5000, grad_fn=<MseLossBackward>)
output :  tensor([[107946.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(284763.9688, grad_fn=<MseLossBackward>)
output :  tensor([[171243.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1356e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155348.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(23505074., grad_fn=<MseLossBackward>)
output :  tensor([[234107.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(8364568., grad_fn=<MseLossBackward>)
output :  tensor([[115939.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(881750.3750, grad_fn=<MseLossBackward>)
output :  tensor([[178809.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(16728228., grad_fn=<MseLossBackward>)
output :  tensor([[188731.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4126928.7500, grad_fn=<MseLossBackward>)
output :  tensor([[164674.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4126e+10, grad_fn=<MseLossBackward>)
output :  tensor([[92380.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2952e+08, grad_fn=<MseLossBackward>)
output :  tensor([[234389.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(21253252., grad_fn=<MseLossBackward>)
output :  tensor([[176953.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(909609.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140195.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(38238.5820, grad_fn=<MseLossBackward>)
output :  tensor([[239129.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(17056642., grad_fn=<MseLossBackward>)
output :  tensor([[161770.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1510978.7500, grad_fn=<MseLossBackward>)
output :  tensor([[207046.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3913e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134074.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(856897.3750, grad_fn=<MseLossBackward>)
output :  tensor([[186971.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2357e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134439.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2435745.5000, grad_fn=<MseLossBackward>)
output :  tensor([[228829.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(51421224., grad_fn=<MseLossBackward>)
output :  tensor([[227033.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2746e+08, grad_fn=<MseLossBackward>)
output :  tensor([[90151.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(23011.4688, grad_fn=<MseLossBackward>)
output :  tensor([[160455.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1043047.3125, grad_fn=<MseLossBackward>)
output :  tensor([[247981.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5103e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147831.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(8018896.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110316.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8763e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163900.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(359306.5938, grad_fn=<MseLossBackward>)
output :  tensor([[142898.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1213990.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128027.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(29699.6758, grad_fn=<MseLossBackward>)
output :  tensor([[187931.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0508e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120677.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(3321534.7500, grad_fn=<MseLossBackward>)
output :  tensor([[154077.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4315227., grad_fn=<MseLossBackward>)
output :  tensor([[172074.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(105219.1406, grad_fn=<MseLossBackward>)
output :  tensor([[148174.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(7984421.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166809.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(15284068., grad_fn=<MseLossBackward>)
output :  tensor([[138623.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7756e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134954.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8727962., grad_fn=<MseLossBackward>)
output :  tensor([[154429.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3806e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147317.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(10020093., grad_fn=<MseLossBackward>)
output :  tensor([[164508.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(7608632.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134310.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9585e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149773.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(948158.6250, grad_fn=<MseLossBackward>)
output :  tensor([[185033.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8801606., grad_fn=<MseLossBackward>)
output :  tensor([[172122.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9751568., grad_fn=<MseLossBackward>)
output :  tensor([[178693.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1706370.7500, grad_fn=<MseLossBackward>)
output :  tensor([[219058.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(886745.9375, grad_fn=<MseLossBackward>)
output :  tensor([[111884.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(15874435., grad_fn=<MseLossBackward>)
output :  tensor([[134022.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(83212024., grad_fn=<MseLossBackward>)
output :  tensor([[287495.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2235585.7500, grad_fn=<MseLossBackward>)
output :  tensor([[118297.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(5280193.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179876.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6099e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185480.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(230700.0938, grad_fn=<MseLossBackward>)
output :  tensor([[173436.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4554e+08, grad_fn=<MseLossBackward>)
output :  tensor([[250702.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9038e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221869.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(17087.3906, grad_fn=<MseLossBackward>)
output :  tensor([[122726.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8312e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174495.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6207e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122951.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1099647.1250, grad_fn=<MseLossBackward>)
output :  tensor([[183768.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5031e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151063.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3749911.2500, grad_fn=<MseLossBackward>)
output :  tensor([[155047.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(73063760., grad_fn=<MseLossBackward>)
output :  tensor([[205628.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(450534.6250, grad_fn=<MseLossBackward>)
output :  tensor([[145845.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7809e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175873.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(15903.5742, grad_fn=<MseLossBackward>)
output :  tensor([[251518.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8294e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148420.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(176702., grad_fn=<MseLossBackward>)
output :  tensor([[204211.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2390212.7500, grad_fn=<MseLossBackward>)
output :  tensor([[162570.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6869313.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123739.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2773e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139120.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(11359217., grad_fn=<MseLossBackward>)
output :  tensor([[181868.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4541427.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198975.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(80556512., grad_fn=<MseLossBackward>)
output :  tensor([[239462.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4539e+09, grad_fn=<MseLossBackward>)
output :  tensor([[253327.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(13490814., grad_fn=<MseLossBackward>)
output :  tensor([[191613.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6227e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145189.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8826e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142987.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2286569.2500, grad_fn=<MseLossBackward>)
output :  tensor([[73007.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0895e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144181.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(84306256., grad_fn=<MseLossBackward>)
output :  tensor([[130633.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(3004941., grad_fn=<MseLossBackward>)
output :  tensor([[156326.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(5410421.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127977.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(955903.3750, grad_fn=<MseLossBackward>)
output :  tensor([[77924.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2028087.5000, grad_fn=<MseLossBackward>)
output :  tensor([[81292.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(500357.2812, grad_fn=<MseLossBackward>)
output :  tensor([[223034.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(80382992., grad_fn=<MseLossBackward>)
output :  tensor([[141753.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5576e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128767.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(3001421., grad_fn=<MseLossBackward>)
output :  tensor([[171376.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(19151564., grad_fn=<MseLossBackward>)
output :  tensor([[236884.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3550103.7500, grad_fn=<MseLossBackward>)
output :  tensor([[193213.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1152301.6250, grad_fn=<MseLossBackward>)
output :  tensor([[156991.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(983382.1250, grad_fn=<MseLossBackward>)
output :  tensor([[195971.]], grad_fn=<AddmmBackward>)
loss:  tensor(3721041., grad_fn=<MseLossBackward>)
output :  tensor([[205176.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0127e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135891.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1229326.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154825.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(30575.8008, grad_fn=<MseLossBackward>)
output :  tensor([[136352.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(124443.5859, grad_fn=<MseLossBackward>)
output :  tensor([[203426.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0613e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155370.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1878355.8750, grad_fn=<MseLossBackward>)
output :  tensor([[136850.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8793e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145858.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(918033.4375, grad_fn=<MseLossBackward>)
output :  tensor([[209539.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6053522., grad_fn=<MseLossBackward>)
output :  tensor([[98956.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8752e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167282.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(47428.6719, grad_fn=<MseLossBackward>)
output :  tensor([[126899.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(1211805.3750, grad_fn=<MseLossBackward>)
output :  tensor([[146622.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(142671.4531, grad_fn=<MseLossBackward>)
output :  tensor([[101533.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5327e+09, grad_fn=<MseLossBackward>)
output :  tensor([[134121.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(11416902., grad_fn=<MseLossBackward>)
output :  tensor([[237246.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1553489.6250, grad_fn=<MseLossBackward>)
output :  tensor([[146891.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3577122., grad_fn=<MseLossBackward>)
output :  tensor([[138148.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(420066., grad_fn=<MseLossBackward>)
output :  tensor([[164823.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3560e+09, grad_fn=<MseLossBackward>)
output :  tensor([[272635.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(28774842., grad_fn=<MseLossBackward>)
output :  tensor([[176983.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3934148.2500, grad_fn=<MseLossBackward>)
output :  tensor([[102494.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(79026.8750, grad_fn=<MseLossBackward>)
output :  tensor([[204353.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3504e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160289.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1662326.7500, grad_fn=<MseLossBackward>)
output :  tensor([[162042.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6390e+10, grad_fn=<MseLossBackward>)
output :  tensor([[102081.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(14302460., grad_fn=<MseLossBackward>)
output :  tensor([[122569.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(1062171.7500, grad_fn=<MseLossBackward>)
output :  tensor([[156615.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(379302., grad_fn=<MseLossBackward>)
output :  tensor([[138696.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1700212.2500, grad_fn=<MseLossBackward>)
output :  tensor([[201295.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1678968., grad_fn=<MseLossBackward>)
output :  tensor([[141522.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(228185.3438, grad_fn=<MseLossBackward>)
output :  tensor([[260295.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(3936442., grad_fn=<MseLossBackward>)
output :  tensor([[127952.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2217e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166712.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1470194.1250, grad_fn=<MseLossBackward>)
output :  tensor([[192318.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(14579033., grad_fn=<MseLossBackward>)
output :  tensor([[123927.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9397e+08, grad_fn=<MseLossBackward>)
output :  tensor([[251471.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2165220.2500, grad_fn=<MseLossBackward>)
output :  tensor([[157761.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5489e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244249.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1211134.6250, grad_fn=<MseLossBackward>)
output :  tensor([[144914.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(836081.6250, grad_fn=<MseLossBackward>)
output :  tensor([[208693.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1708208.1250, grad_fn=<MseLossBackward>)
output :  tensor([[177228.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(23315468., grad_fn=<MseLossBackward>)
output :  tensor([[151564.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5933563., grad_fn=<MseLossBackward>)
output :  tensor([[113241.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(22641018., grad_fn=<MseLossBackward>)
output :  tensor([[238101.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3999e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238527.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2167014., grad_fn=<MseLossBackward>)
output :  tensor([[155485.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4617328., grad_fn=<MseLossBackward>)
output :  tensor([[256410.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2282885., grad_fn=<MseLossBackward>)
output :  tensor([[124400.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(97939472., grad_fn=<MseLossBackward>)
output :  tensor([[178233.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4990407., grad_fn=<MseLossBackward>)
output :  tensor([[160711.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(505587.6562, grad_fn=<MseLossBackward>)
output :  tensor([[131160.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(25845.5859, grad_fn=<MseLossBackward>)
output :  tensor([[192513.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9708e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163531.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(219433.6875, grad_fn=<MseLossBackward>)
output :  tensor([[165397.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(5749804.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158801.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(642928.3125, grad_fn=<MseLossBackward>)
output :  tensor([[157266.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(54259796., grad_fn=<MseLossBackward>)
output :  tensor([[171848.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8873e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161824.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3329256.5000, grad_fn=<MseLossBackward>)
output :  tensor([[378783.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(26904320., grad_fn=<MseLossBackward>)
output :  tensor([[125876.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(1261673., grad_fn=<MseLossBackward>)
output :  tensor([[128527.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8514e+09, grad_fn=<MseLossBackward>)
output :  tensor([[282507.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1675164., grad_fn=<MseLossBackward>)
output :  tensor([[164573.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6623787., grad_fn=<MseLossBackward>)
output :  tensor([[128259.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(60213840., grad_fn=<MseLossBackward>)
output :  tensor([[233961.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3846869.2500, grad_fn=<MseLossBackward>)
output :  tensor([[180638.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(19238.5566, grad_fn=<MseLossBackward>)
output :  tensor([[151312.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(472377., grad_fn=<MseLossBackward>)
output :  tensor([[144107.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(796807.3125, grad_fn=<MseLossBackward>)
output :  tensor([[154947.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2572e+08, grad_fn=<MseLossBackward>)
output :  tensor([[99572.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(182569.2656, grad_fn=<MseLossBackward>)
output :  tensor([[72583.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5834e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167609.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6808348.5000, grad_fn=<MseLossBackward>)
output :  tensor([[189083.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5145e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158538.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(290116.8750, grad_fn=<MseLossBackward>)
output :  tensor([[160274.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(7700538.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136658.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(626274.3750, grad_fn=<MseLossBackward>)
output :  tensor([[209158.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(10296578., grad_fn=<MseLossBackward>)
output :  tensor([[137474.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(275854.7500, grad_fn=<MseLossBackward>)
output :  tensor([[182247.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6321e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146999.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(999593.8125, grad_fn=<MseLossBackward>)
output :  tensor([[108942.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7303e+08, grad_fn=<MseLossBackward>)
output :  tensor([[96047.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(4193952., grad_fn=<MseLossBackward>)
output :  tensor([[176853.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(3434246., grad_fn=<MseLossBackward>)
output :  tensor([[264122.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(13860496., grad_fn=<MseLossBackward>)
output :  tensor([[141183.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(99865.8750, grad_fn=<MseLossBackward>)
output :  tensor([[158070.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3328458.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132709.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(43916.4414, grad_fn=<MseLossBackward>)
output :  tensor([[147123.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5646638.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165928.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3885765., grad_fn=<MseLossBackward>)
output :  tensor([[127310.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(96381.1406, grad_fn=<MseLossBackward>)
output :  tensor([[172261.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4319e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157854.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(729956.6250, grad_fn=<MseLossBackward>)
output :  tensor([[115797.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(493901.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158650.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5279e+09, grad_fn=<MseLossBackward>)
output :  tensor([[50130.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(3494650.5000, grad_fn=<MseLossBackward>)
output :  tensor([[230525.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7199e+09, grad_fn=<MseLossBackward>)
output :  tensor([[200185.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(663003.0625, grad_fn=<MseLossBackward>)
output :  tensor([[182168.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(8019958.5000, grad_fn=<MseLossBackward>)
output :  tensor([[106722.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(522604.7500, grad_fn=<MseLossBackward>)
output :  tensor([[88049.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1101876.6250, grad_fn=<MseLossBackward>)
output :  tensor([[137711.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5236088., grad_fn=<MseLossBackward>)
output :  tensor([[223543.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9641e+09, grad_fn=<MseLossBackward>)
output :  tensor([[206469.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1062220.1250, grad_fn=<MseLossBackward>)
output :  tensor([[165594.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(352928.8125, grad_fn=<MseLossBackward>)
output :  tensor([[174954.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1082e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191583.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2506977.5000, grad_fn=<MseLossBackward>)
output :  tensor([[90837.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(14726646., grad_fn=<MseLossBackward>)
output :  tensor([[138661.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1792795.5000, grad_fn=<MseLossBackward>)
output :  tensor([[111516.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1033748.8125, grad_fn=<MseLossBackward>)
output :  tensor([[148238.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5077e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171976.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6791e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195003.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(99920640., grad_fn=<MseLossBackward>)
output :  tensor([[178944.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1114146.2500, grad_fn=<MseLossBackward>)
output :  tensor([[95449.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1103862.1250, grad_fn=<MseLossBackward>)
output :  tensor([[118276.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(603279.8750, grad_fn=<MseLossBackward>)
output :  tensor([[160967.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3051e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203236.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(10475741., grad_fn=<MseLossBackward>)
output :  tensor([[144797.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(635283.7500, grad_fn=<MseLossBackward>)
train_loss: [2.5546486e+09]
epoch_result tensor([0.])
output :  tensor([[155202.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(10874331., grad_fn=<MseLossBackward>)
output :  tensor([[123597.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(2551332.2500, grad_fn=<MseLossBackward>)
output :  tensor([[195848.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2713226.7500, grad_fn=<MseLossBackward>)
output :  tensor([[178429.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2042666.2500, grad_fn=<MseLossBackward>)
output :  tensor([[152164.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6746e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127676.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(104874.7734, grad_fn=<MseLossBackward>)
output :  tensor([[139155.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3402238., grad_fn=<MseLossBackward>)
output :  tensor([[120492.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(2227299.7500, grad_fn=<MseLossBackward>)
output :  tensor([[64291.2773]], grad_fn=<AddmmBackward>)
loss:  tensor(33538894., grad_fn=<MseLossBackward>)
output :  tensor([[166307.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(94508.2109, grad_fn=<MseLossBackward>)
output :  tensor([[150242.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0491e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224890.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(12075.9492, grad_fn=<MseLossBackward>)
output :  tensor([[169268.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(72008.3672, grad_fn=<MseLossBackward>)
output :  tensor([[245666.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(16267106., grad_fn=<MseLossBackward>)
output :  tensor([[55276.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(76201.8750, grad_fn=<MseLossBackward>)
output :  tensor([[158780.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0393e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165347.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(93164720., grad_fn=<MseLossBackward>)
output :  tensor([[168364.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4076e+08, grad_fn=<MseLossBackward>)
output :  tensor([[276163.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1352787.1250, grad_fn=<MseLossBackward>)
output :  tensor([[197108.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(11718.0625, grad_fn=<MseLossBackward>)
output :  tensor([[138650.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4993e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195932.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4217632.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179264.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0826e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151544.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(296055., grad_fn=<MseLossBackward>)
output :  tensor([[164789.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(27154032., grad_fn=<MseLossBackward>)
output :  tensor([[89124.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(13868816., grad_fn=<MseLossBackward>)
output :  tensor([[171170.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3838e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186826.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3336216.5000, grad_fn=<MseLossBackward>)
output :  tensor([[208471.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2117e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110538.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(289460.8125, grad_fn=<MseLossBackward>)
output :  tensor([[172136.]], grad_fn=<AddmmBackward>)
loss:  tensor(1290496., grad_fn=<MseLossBackward>)
output :  tensor([[138385.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3555640.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128575.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(179882.0156, grad_fn=<MseLossBackward>)
output :  tensor([[121172.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2796524.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144658.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6500e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169803.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1082e+10, grad_fn=<MseLossBackward>)
output :  tensor([[148323.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1894021., grad_fn=<MseLossBackward>)
output :  tensor([[178930.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1143930.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138112.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(8336032., grad_fn=<MseLossBackward>)
output :  tensor([[104696.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1598e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132747.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7655e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138919.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(15364195., grad_fn=<MseLossBackward>)
output :  tensor([[132127.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(26288692., grad_fn=<MseLossBackward>)
output :  tensor([[220590.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(19440522., grad_fn=<MseLossBackward>)
output :  tensor([[132915.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(442827.8750, grad_fn=<MseLossBackward>)
output :  tensor([[150535.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2358960., grad_fn=<MseLossBackward>)
output :  tensor([[112816.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(666404.3750, grad_fn=<MseLossBackward>)
output :  tensor([[160741.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(549683.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145570.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4433e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193876.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3520431.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134251.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(39352.6406, grad_fn=<MseLossBackward>)
output :  tensor([[112186.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4781397., grad_fn=<MseLossBackward>)
output :  tensor([[231938.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4248172., grad_fn=<MseLossBackward>)
output :  tensor([[167127.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1495e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162377.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(11410462., grad_fn=<MseLossBackward>)
output :  tensor([[203424.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8587e+10, grad_fn=<MseLossBackward>)
output :  tensor([[248871.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1052e+10, grad_fn=<MseLossBackward>)
output :  tensor([[140132.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(11343108., grad_fn=<MseLossBackward>)
output :  tensor([[138392.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(19294606., grad_fn=<MseLossBackward>)
output :  tensor([[153435.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2448638.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134881.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(23826602., grad_fn=<MseLossBackward>)
output :  tensor([[180408.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3347e+09, grad_fn=<MseLossBackward>)
output :  tensor([[181550.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6499472., grad_fn=<MseLossBackward>)
output :  tensor([[159772.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2985444., grad_fn=<MseLossBackward>)
output :  tensor([[133152.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(96964336., grad_fn=<MseLossBackward>)
output :  tensor([[143226.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(528301.8125, grad_fn=<MseLossBackward>)
output :  tensor([[145224.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(50603.9102, grad_fn=<MseLossBackward>)
output :  tensor([[173576.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3705e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195490.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6265e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137918.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2013383.6250, grad_fn=<MseLossBackward>)
output :  tensor([[172530.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(397372.6250, grad_fn=<MseLossBackward>)
output :  tensor([[182148.]], grad_fn=<AddmmBackward>)
loss:  tensor(1317904., grad_fn=<MseLossBackward>)
output :  tensor([[117458.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(6044491., grad_fn=<MseLossBackward>)
output :  tensor([[218912.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4357004., grad_fn=<MseLossBackward>)
output :  tensor([[179843.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(13368735., grad_fn=<MseLossBackward>)
output :  tensor([[127662.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(4674480.5000, grad_fn=<MseLossBackward>)
output :  tensor([[197176.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(457863.6875, grad_fn=<MseLossBackward>)
output :  tensor([[171668.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(10442289., grad_fn=<MseLossBackward>)
output :  tensor([[213155.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9962e+10, grad_fn=<MseLossBackward>)
output :  tensor([[208698.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(5296399., grad_fn=<MseLossBackward>)
output :  tensor([[163676.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0677e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196248.]], grad_fn=<AddmmBackward>)
loss:  tensor(3055504., grad_fn=<MseLossBackward>)
output :  tensor([[110797.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(4849939.5000, grad_fn=<MseLossBackward>)
output :  tensor([[116866.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(19067140., grad_fn=<MseLossBackward>)
output :  tensor([[110900.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(1209879.7500, grad_fn=<MseLossBackward>)
output :  tensor([[145590.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1462474.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161805.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2702e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177856.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4596200., grad_fn=<MseLossBackward>)
output :  tensor([[128540.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(1081811.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142320.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(7181981.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178095.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8659e+09, grad_fn=<MseLossBackward>)
output :  tensor([[117677.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(604336.1875, grad_fn=<MseLossBackward>)
output :  tensor([[199696.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7270522.5000, grad_fn=<MseLossBackward>)
output :  tensor([[149199.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(17633438., grad_fn=<MseLossBackward>)
output :  tensor([[209975.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(8551878., grad_fn=<MseLossBackward>)
output :  tensor([[129690.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(13619560., grad_fn=<MseLossBackward>)
output :  tensor([[247004.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1750618.3750, grad_fn=<MseLossBackward>)
output :  tensor([[241757.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8699e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146361.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2385e+08, grad_fn=<MseLossBackward>)
output :  tensor([[86444.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4743e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194108.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5273e+09, grad_fn=<MseLossBackward>)
output :  tensor([[80989.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(106.3477, grad_fn=<MseLossBackward>)
output :  tensor([[139252.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(61380.0625, grad_fn=<MseLossBackward>)
output :  tensor([[76031.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(282807.9062, grad_fn=<MseLossBackward>)
output :  tensor([[143566.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(376593.1562, grad_fn=<MseLossBackward>)
output :  tensor([[176008.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(79.8789, grad_fn=<MseLossBackward>)
output :  tensor([[152953.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(298525.6250, grad_fn=<MseLossBackward>)
output :  tensor([[110237.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(8052027., grad_fn=<MseLossBackward>)
output :  tensor([[206525.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1930e+10, grad_fn=<MseLossBackward>)
output :  tensor([[125147.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(11239675., grad_fn=<MseLossBackward>)
output :  tensor([[269813.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0376e+08, grad_fn=<MseLossBackward>)
output :  tensor([[301998.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(64025504., grad_fn=<MseLossBackward>)
output :  tensor([[107509.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(95.6729, grad_fn=<MseLossBackward>)
output :  tensor([[169812.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7220892.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133974.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(6.7467e+08, grad_fn=<MseLossBackward>)
output :  tensor([[142273.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(10714472., grad_fn=<MseLossBackward>)
output :  tensor([[131339.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1187384.7500, grad_fn=<MseLossBackward>)
output :  tensor([[125553.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(305826.2812, grad_fn=<MseLossBackward>)
output :  tensor([[135747.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8894e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227132.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8364e+10, grad_fn=<MseLossBackward>)
output :  tensor([[192893.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1936e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142118.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3173853.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128767.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(1607011.7500, grad_fn=<MseLossBackward>)
output :  tensor([[112157.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(823173.4375, grad_fn=<MseLossBackward>)
output :  tensor([[256166.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8309e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133362.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2680076., grad_fn=<MseLossBackward>)
output :  tensor([[199391.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(13018228., grad_fn=<MseLossBackward>)
output :  tensor([[102299.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6763575.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139295.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(427838.6250, grad_fn=<MseLossBackward>)
output :  tensor([[212521.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4349e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174023.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(34534720., grad_fn=<MseLossBackward>)
output :  tensor([[186888.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3565016., grad_fn=<MseLossBackward>)
output :  tensor([[163058.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1299e+10, grad_fn=<MseLossBackward>)
output :  tensor([[303487.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9303e+08, grad_fn=<MseLossBackward>)
output :  tensor([[194974.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(8560745., grad_fn=<MseLossBackward>)
output :  tensor([[257147.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1233e+10, grad_fn=<MseLossBackward>)
output :  tensor([[224463.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7253e+09, grad_fn=<MseLossBackward>)
output :  tensor([[282559.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1862e+09, grad_fn=<MseLossBackward>)
output :  tensor([[226639.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(6968280., grad_fn=<MseLossBackward>)
output :  tensor([[222083.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8872e+10, grad_fn=<MseLossBackward>)
output :  tensor([[191952.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(25478360., grad_fn=<MseLossBackward>)
output :  tensor([[158719.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8327e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135071.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6610362.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133188.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5342454.5000, grad_fn=<MseLossBackward>)
output :  tensor([[91737.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(543606.6875, grad_fn=<MseLossBackward>)
output :  tensor([[109380.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1904788.1250, grad_fn=<MseLossBackward>)
output :  tensor([[277152.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6778e+09, grad_fn=<MseLossBackward>)
output :  tensor([[232261.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(7498270., grad_fn=<MseLossBackward>)
output :  tensor([[148846.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(14796283., grad_fn=<MseLossBackward>)
output :  tensor([[140670.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(10053556., grad_fn=<MseLossBackward>)
output :  tensor([[174293.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(314107.7188, grad_fn=<MseLossBackward>)
output :  tensor([[145121.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(16440.0469, grad_fn=<MseLossBackward>)
output :  tensor([[165619.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3409e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167223.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4942354., grad_fn=<MseLossBackward>)
output :  tensor([[137596.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(355849.5312, grad_fn=<MseLossBackward>)
output :  tensor([[188794.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3950e+09, grad_fn=<MseLossBackward>)
output :  tensor([[113975.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(3903433.7500, grad_fn=<MseLossBackward>)
output :  tensor([[166776.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(27289360., grad_fn=<MseLossBackward>)
output :  tensor([[121017.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(1035926.3750, grad_fn=<MseLossBackward>)
output :  tensor([[87234.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(55041.5586, grad_fn=<MseLossBackward>)
output :  tensor([[179354.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(416529.0625, grad_fn=<MseLossBackward>)
output :  tensor([[112055.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(4646146.5000, grad_fn=<MseLossBackward>)
output :  tensor([[239635.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(404356.8750, grad_fn=<MseLossBackward>)
output :  tensor([[245692.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(480162.3750, grad_fn=<MseLossBackward>)
output :  tensor([[134332.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(23349130., grad_fn=<MseLossBackward>)
output :  tensor([[108616.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(117135.0625, grad_fn=<MseLossBackward>)
output :  tensor([[288223.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2180e+10, grad_fn=<MseLossBackward>)
output :  tensor([[171670.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(29075.5781, grad_fn=<MseLossBackward>)
output :  tensor([[126285.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1653032.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144418.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9794e+08, grad_fn=<MseLossBackward>)
output :  tensor([[202742.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2672e+08, grad_fn=<MseLossBackward>)
output :  tensor([[138922.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4315162.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161129.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4130e+10, grad_fn=<MseLossBackward>)
output :  tensor([[157276.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(11398326., grad_fn=<MseLossBackward>)
output :  tensor([[130383.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(780889.8125, grad_fn=<MseLossBackward>)
output :  tensor([[250688.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6336e+10, grad_fn=<MseLossBackward>)
output :  tensor([[396641.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(28714526., grad_fn=<MseLossBackward>)
output :  tensor([[111231.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(4979627., grad_fn=<MseLossBackward>)
output :  tensor([[108421.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0158e+08, grad_fn=<MseLossBackward>)
output :  tensor([[160103.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(363778.6250, grad_fn=<MseLossBackward>)
output :  tensor([[129277.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1118e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162905.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4921e+09, grad_fn=<MseLossBackward>)
output :  tensor([[170520.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6628e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103014.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(343386.8438, grad_fn=<MseLossBackward>)
output :  tensor([[140325.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(454865.9375, grad_fn=<MseLossBackward>)
output :  tensor([[363277.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(16131268., grad_fn=<MseLossBackward>)
output :  tensor([[209178.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0090e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174488.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1022879.3750, grad_fn=<MseLossBackward>)
output :  tensor([[202999.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(9978.1367, grad_fn=<MseLossBackward>)
output :  tensor([[136398.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6768290., grad_fn=<MseLossBackward>)
output :  tensor([[192599.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3613682.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134267.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1650e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176194.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(23096134., grad_fn=<MseLossBackward>)
output :  tensor([[242763.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(582956.1250, grad_fn=<MseLossBackward>)
output :  tensor([[173092.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(822960.8125, grad_fn=<MseLossBackward>)
output :  tensor([[108809.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(654835., grad_fn=<MseLossBackward>)
output :  tensor([[262347.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4900135.5000, grad_fn=<MseLossBackward>)
output :  tensor([[250461.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(212809.2188, grad_fn=<MseLossBackward>)
output :  tensor([[119025.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(15796278., grad_fn=<MseLossBackward>)
output :  tensor([[216078.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4717e+09, grad_fn=<MseLossBackward>)
output :  tensor([[306403.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5706e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206902.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9585.6338, grad_fn=<MseLossBackward>)
output :  tensor([[214497.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5751e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159894.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3977220., grad_fn=<MseLossBackward>)
output :  tensor([[166357.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(13191878., grad_fn=<MseLossBackward>)
output :  tensor([[163411.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(41980276., grad_fn=<MseLossBackward>)
output :  tensor([[167929.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4285029.5000, grad_fn=<MseLossBackward>)
output :  tensor([[236291.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0054e+09, grad_fn=<MseLossBackward>)
output :  tensor([[222752.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(44932724., grad_fn=<MseLossBackward>)
output :  tensor([[159005.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4412e+08, grad_fn=<MseLossBackward>)
output :  tensor([[122160.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(704222.5625, grad_fn=<MseLossBackward>)
output :  tensor([[178326.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1759146.2500, grad_fn=<MseLossBackward>)
output :  tensor([[182819.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9568e+09, grad_fn=<MseLossBackward>)
output :  tensor([[210106.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4044e+10, grad_fn=<MseLossBackward>)
output :  tensor([[132937.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2232409.5000, grad_fn=<MseLossBackward>)
output :  tensor([[146830.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3660e+08, grad_fn=<MseLossBackward>)
output :  tensor([[276893.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(11402.2354, grad_fn=<MseLossBackward>)
output :  tensor([[87306.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5319582., grad_fn=<MseLossBackward>)
output :  tensor([[238089.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2526361.2500, grad_fn=<MseLossBackward>)
output :  tensor([[263492.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0204e+11, grad_fn=<MseLossBackward>)
output :  tensor([[168864.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1288579.7500, grad_fn=<MseLossBackward>)
output :  tensor([[195482.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5617e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152893.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4437276.5000, grad_fn=<MseLossBackward>)
output :  tensor([[206892.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9825e+09, grad_fn=<MseLossBackward>)
output :  tensor([[127982.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1035338.0625, grad_fn=<MseLossBackward>)
output :  tensor([[143654.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1810622.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168828.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9322e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186926.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1158852.2500, grad_fn=<MseLossBackward>)
output :  tensor([[122348.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(13337047., grad_fn=<MseLossBackward>)
output :  tensor([[135611.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(789126.8750, grad_fn=<MseLossBackward>)
output :  tensor([[166422.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(43260628., grad_fn=<MseLossBackward>)
output :  tensor([[197612.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7445e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237710.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(27978644., grad_fn=<MseLossBackward>)
output :  tensor([[151508.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(12193737., grad_fn=<MseLossBackward>)
output :  tensor([[196857.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(734582.9375, grad_fn=<MseLossBackward>)
output :  tensor([[161226.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9674e+08, grad_fn=<MseLossBackward>)
output :  tensor([[181336.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3372847., grad_fn=<MseLossBackward>)
output :  tensor([[179743.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(24585.2598, grad_fn=<MseLossBackward>)
output :  tensor([[99671.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(7134408., grad_fn=<MseLossBackward>)
output :  tensor([[173543.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1333e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134875.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(15558.6641, grad_fn=<MseLossBackward>)
output :  tensor([[117387.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(5698328.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174240.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(57750.0977, grad_fn=<MseLossBackward>)
output :  tensor([[85514.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(264742.4062, grad_fn=<MseLossBackward>)
output :  tensor([[284033.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(35600612., grad_fn=<MseLossBackward>)
output :  tensor([[169192.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(17576926., grad_fn=<MseLossBackward>)
output :  tensor([[193844.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9411e+10, grad_fn=<MseLossBackward>)
output :  tensor([[249204.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7504e+08, grad_fn=<MseLossBackward>)
output :  tensor([[152592.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2535110.7500, grad_fn=<MseLossBackward>)
output :  tensor([[125148.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(1318603.6250, grad_fn=<MseLossBackward>)
output :  tensor([[117821.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(4318311.5000, grad_fn=<MseLossBackward>)
output :  tensor([[140028.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2640e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174595.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(354285.3750, grad_fn=<MseLossBackward>)
output :  tensor([[109015.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0308e+08, grad_fn=<MseLossBackward>)
output :  tensor([[210228.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1615e+10, grad_fn=<MseLossBackward>)
output :  tensor([[240733.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(586779.9375, grad_fn=<MseLossBackward>)
output :  tensor([[254713.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9734e+10, grad_fn=<MseLossBackward>)
output :  tensor([[220167.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5467e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196295.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4210e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190549.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9296973., grad_fn=<MseLossBackward>)
output :  tensor([[207058.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7442e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187222.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2135e+10, grad_fn=<MseLossBackward>)
output :  tensor([[176020.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7397295., grad_fn=<MseLossBackward>)
output :  tensor([[152256.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(65864.4141, grad_fn=<MseLossBackward>)
output :  tensor([[333512.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(12160477., grad_fn=<MseLossBackward>)
output :  tensor([[207960.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(16317686., grad_fn=<MseLossBackward>)
output :  tensor([[160042.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1826.2268, grad_fn=<MseLossBackward>)
output :  tensor([[187232.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9450e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107128.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(4532541., grad_fn=<MseLossBackward>)
output :  tensor([[277762.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6860e+10, grad_fn=<MseLossBackward>)
output :  tensor([[168581.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(28290266., grad_fn=<MseLossBackward>)
output :  tensor([[219603.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(37251948., grad_fn=<MseLossBackward>)
output :  tensor([[216275.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(22318834., grad_fn=<MseLossBackward>)
output :  tensor([[179655.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(207181.4375, grad_fn=<MseLossBackward>)
output :  tensor([[202921.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1258568.5000, grad_fn=<MseLossBackward>)
output :  tensor([[156859.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3458089., grad_fn=<MseLossBackward>)
output :  tensor([[145235.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0463e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118406.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(8752.4795, grad_fn=<MseLossBackward>)
output :  tensor([[139475.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(275149.4375, grad_fn=<MseLossBackward>)
output :  tensor([[146034.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(8795395., grad_fn=<MseLossBackward>)
output :  tensor([[203249.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5563e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160699.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1438537.8750, grad_fn=<MseLossBackward>)
output :  tensor([[99102.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(157646.2188, grad_fn=<MseLossBackward>)
output :  tensor([[226800.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7422e+08, grad_fn=<MseLossBackward>)
output :  tensor([[184214.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5022e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173542.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(8659686., grad_fn=<MseLossBackward>)
output :  tensor([[79384.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6839287.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129890.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(1934685.3750, grad_fn=<MseLossBackward>)
output :  tensor([[217984.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(15873252., grad_fn=<MseLossBackward>)
output :  tensor([[143653.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(120343.9453, grad_fn=<MseLossBackward>)
output :  tensor([[131711.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2929767., grad_fn=<MseLossBackward>)
output :  tensor([[147531.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(24320154., grad_fn=<MseLossBackward>)
output :  tensor([[177145.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5718e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146044.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4178511., grad_fn=<MseLossBackward>)
output :  tensor([[161814.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(3291049.5000, grad_fn=<MseLossBackward>)
output :  tensor([[215023.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(552.9846, grad_fn=<MseLossBackward>)
output :  tensor([[133890.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3468e+08, grad_fn=<MseLossBackward>)
output :  tensor([[257665.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(7102475., grad_fn=<MseLossBackward>)
output :  tensor([[159986.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(236834.3125, grad_fn=<MseLossBackward>)
output :  tensor([[129228.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(531122.1250, grad_fn=<MseLossBackward>)
output :  tensor([[97212.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(4896020.5000, grad_fn=<MseLossBackward>)
output :  tensor([[150044.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2961e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180261.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(130625.7734, grad_fn=<MseLossBackward>)
output :  tensor([[120835.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(112817.2656, grad_fn=<MseLossBackward>)
output :  tensor([[189796.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5330e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145561.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3641e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148683.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1480746.7500, grad_fn=<MseLossBackward>)
output :  tensor([[186854.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(801556.5000, grad_fn=<MseLossBackward>)
output :  tensor([[253901.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5347e+09, grad_fn=<MseLossBackward>)
output :  tensor([[92031.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(282874.4062, grad_fn=<MseLossBackward>)
output :  tensor([[239546.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(205988.3281, grad_fn=<MseLossBackward>)
output :  tensor([[128039.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(211765.3438, grad_fn=<MseLossBackward>)
output :  tensor([[166947.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7916e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114342.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0572e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175364.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(404197.9375, grad_fn=<MseLossBackward>)
output :  tensor([[164332.]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2160e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154623.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8193e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238596.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(162497.1719, grad_fn=<MseLossBackward>)
output :  tensor([[223817.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1684e+09, grad_fn=<MseLossBackward>)
output :  tensor([[129767.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(7659964.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122790.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(10300489., grad_fn=<MseLossBackward>)
output :  tensor([[224504.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(6225882.5000, grad_fn=<MseLossBackward>)
output :  tensor([[231280.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7397380., grad_fn=<MseLossBackward>)
output :  tensor([[223668.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9188855., grad_fn=<MseLossBackward>)
output :  tensor([[149333.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1779014.1250, grad_fn=<MseLossBackward>)
output :  tensor([[211540.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2373477.2500, grad_fn=<MseLossBackward>)
output :  tensor([[126456.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(41681248., grad_fn=<MseLossBackward>)
output :  tensor([[135009.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6297355., grad_fn=<MseLossBackward>)
output :  tensor([[308816.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(38238764., grad_fn=<MseLossBackward>)
output :  tensor([[140387.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(375654.0625, grad_fn=<MseLossBackward>)
output :  tensor([[123166.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1547e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110686.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(1408319.8750, grad_fn=<MseLossBackward>)
output :  tensor([[158689.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9073e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182881.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4353e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172108.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(795636.1250, grad_fn=<MseLossBackward>)
output :  tensor([[194369.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(43965188., grad_fn=<MseLossBackward>)
output :  tensor([[100531.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(282907.6250, grad_fn=<MseLossBackward>)
output :  tensor([[176023.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8860203., grad_fn=<MseLossBackward>)
output :  tensor([[166239.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2755807.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143682.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(21921270., grad_fn=<MseLossBackward>)
output :  tensor([[260301.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7611e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144072.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4896e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171313.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2844018.7500, grad_fn=<MseLossBackward>)
output :  tensor([[142924.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8553614., grad_fn=<MseLossBackward>)
output :  tensor([[198631.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3490591.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167446.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6520761., grad_fn=<MseLossBackward>)
output :  tensor([[240018.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(15854706., grad_fn=<MseLossBackward>)
output :  tensor([[133593.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(822337.2500, grad_fn=<MseLossBackward>)
output :  tensor([[149728.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(143297.7344, grad_fn=<MseLossBackward>)
output :  tensor([[211828.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(10058214., grad_fn=<MseLossBackward>)
output :  tensor([[168636.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(13220610., grad_fn=<MseLossBackward>)
output :  tensor([[193185.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(17518280., grad_fn=<MseLossBackward>)
output :  tensor([[129680.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5963e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129583.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(340654.6250, grad_fn=<MseLossBackward>)
output :  tensor([[140036.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1344.8264, grad_fn=<MseLossBackward>)
output :  tensor([[203418.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3668e+09, grad_fn=<MseLossBackward>)
output :  tensor([[168264.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8371e+09, grad_fn=<MseLossBackward>)
output :  tensor([[73617.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8544e+08, grad_fn=<MseLossBackward>)
output :  tensor([[91864.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(54236320., grad_fn=<MseLossBackward>)
output :  tensor([[253429.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(18751.8789, grad_fn=<MseLossBackward>)
output :  tensor([[202156.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9887e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115916.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(839528.3750, grad_fn=<MseLossBackward>)
output :  tensor([[156220.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7839e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209831.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0339e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182072.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7313e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158171.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(10058214., grad_fn=<MseLossBackward>)
output :  tensor([[169678.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(103643.7500, grad_fn=<MseLossBackward>)
output :  tensor([[115655.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(429844.1250, grad_fn=<MseLossBackward>)
output :  tensor([[158356.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(11266617., grad_fn=<MseLossBackward>)
output :  tensor([[193747.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7298e+08, grad_fn=<MseLossBackward>)
output :  tensor([[219770.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(72975.9609, grad_fn=<MseLossBackward>)
output :  tensor([[247092.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4791e+11, grad_fn=<MseLossBackward>)
output :  tensor([[146320.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(461189.5312, grad_fn=<MseLossBackward>)
output :  tensor([[108375.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(10863.1768, grad_fn=<MseLossBackward>)
output :  tensor([[170945.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1999e+08, grad_fn=<MseLossBackward>)
output :  tensor([[150192.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(94854.3750, grad_fn=<MseLossBackward>)
output :  tensor([[237137.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(18816.1230, grad_fn=<MseLossBackward>)
output :  tensor([[112961.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(4153539.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182727.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(29745.4688, grad_fn=<MseLossBackward>)
output :  tensor([[181417.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(27904476., grad_fn=<MseLossBackward>)
output :  tensor([[165674.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3816e+10, grad_fn=<MseLossBackward>)
output :  tensor([[97175.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6165e+08, grad_fn=<MseLossBackward>)
output :  tensor([[240843.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3400278.5000, grad_fn=<MseLossBackward>)
output :  tensor([[179008.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9048910., grad_fn=<MseLossBackward>)
output :  tensor([[139360.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(408360.9375, grad_fn=<MseLossBackward>)
output :  tensor([[234340.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(435352.5312, grad_fn=<MseLossBackward>)
output :  tensor([[165391.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5719571., grad_fn=<MseLossBackward>)
output :  tensor([[205652.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4244e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134625.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(139934.4375, grad_fn=<MseLossBackward>)
output :  tensor([[187046.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2734e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136571.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(326558.6875, grad_fn=<MseLossBackward>)
output :  tensor([[230416.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(31177566., grad_fn=<MseLossBackward>)
output :  tensor([[227362.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1245e+08, grad_fn=<MseLossBackward>)
output :  tensor([[89950.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(2497.6567, grad_fn=<MseLossBackward>)
output :  tensor([[160349.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(838311.9375, grad_fn=<MseLossBackward>)
output :  tensor([[246147.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5558e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143889.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1233210.2500, grad_fn=<MseLossBackward>)
output :  tensor([[107497.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6400e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161294.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(10277134., grad_fn=<MseLossBackward>)
output :  tensor([[144598.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(358052.6250, grad_fn=<MseLossBackward>)
output :  tensor([[130028.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3344098., grad_fn=<MseLossBackward>)
output :  tensor([[189207.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8710e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123010.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(260929.4062, grad_fn=<MseLossBackward>)
output :  tensor([[150422.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2488950., grad_fn=<MseLossBackward>)
output :  tensor([[170822.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(860952., grad_fn=<MseLossBackward>)
output :  tensor([[149706.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1672818.8750, grad_fn=<MseLossBackward>)
output :  tensor([[158610.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(18401686., grad_fn=<MseLossBackward>)
output :  tensor([[136690.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6677e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130699.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1692357.1250, grad_fn=<MseLossBackward>)
output :  tensor([[153087.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9845e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145618.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2149247.7500, grad_fn=<MseLossBackward>)
output :  tensor([[160161.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2523431.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136494.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0726e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149116.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(99964.6562, grad_fn=<MseLossBackward>)
output :  tensor([[186022.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3911556.7500, grad_fn=<MseLossBackward>)
output :  tensor([[170792.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3213392.2500, grad_fn=<MseLossBackward>)
output :  tensor([[181632.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2666638., grad_fn=<MseLossBackward>)
output :  tensor([[222232.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4983149.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110660.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(7621870., grad_fn=<MseLossBackward>)
output :  tensor([[137179.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5079e+08, grad_fn=<MseLossBackward>)
output :  tensor([[288469.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6096269.5000, grad_fn=<MseLossBackward>)
output :  tensor([[116998.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(996347.0625, grad_fn=<MseLossBackward>)
output :  tensor([[174575.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0634e+09, grad_fn=<MseLossBackward>)
output :  tensor([[186304.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1702861.8750, grad_fn=<MseLossBackward>)
output :  tensor([[174347.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2438e+08, grad_fn=<MseLossBackward>)
output :  tensor([[252193.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2012e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225037.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(9226691., grad_fn=<MseLossBackward>)
output :  tensor([[121146.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3246e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172905.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9622e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125272.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1620369.8750, grad_fn=<MseLossBackward>)
output :  tensor([[183775.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5027e+10, grad_fn=<MseLossBackward>)
output :  tensor([[153221.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(49221.5820, grad_fn=<MseLossBackward>)
output :  tensor([[152739.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(38925900., grad_fn=<MseLossBackward>)
output :  tensor([[203668.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(6925532.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144567.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4561e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176403.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(162421.5938, grad_fn=<MseLossBackward>)
output :  tensor([[257785.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7152e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147341.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(433581.0938, grad_fn=<MseLossBackward>)
output :  tensor([[201237.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2038782.3750, grad_fn=<MseLossBackward>)
output :  tensor([[162302.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(5532198., grad_fn=<MseLossBackward>)
output :  tensor([[120789.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0752e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137813.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4258999.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182572.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2036507.3750, grad_fn=<MseLossBackward>)
output :  tensor([[197925.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(62816772., grad_fn=<MseLossBackward>)
output :  tensor([[233293.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1033e+09, grad_fn=<MseLossBackward>)
output :  tensor([[257725.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(526236.8750, grad_fn=<MseLossBackward>)
output :  tensor([[192782.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5931e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143954.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7514e+09, grad_fn=<MseLossBackward>)
output :  tensor([[142053.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5985821., grad_fn=<MseLossBackward>)
output :  tensor([[70437.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2646e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135915.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(838569.4375, grad_fn=<MseLossBackward>)
output :  tensor([[128773.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(15996.3213, grad_fn=<MseLossBackward>)
output :  tensor([[154360.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(129622.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131167.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(17367666., grad_fn=<MseLossBackward>)
output :  tensor([[76158.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(116745.0078, grad_fn=<MseLossBackward>)
output :  tensor([[86704.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(22132026., grad_fn=<MseLossBackward>)
output :  tensor([[236114.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(16925382., grad_fn=<MseLossBackward>)
output :  tensor([[140108.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6225e+08, grad_fn=<MseLossBackward>)
output :  tensor([[132542.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(4170593.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167268.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(72075.4688, grad_fn=<MseLossBackward>)
output :  tensor([[231881.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(9727966., grad_fn=<MseLossBackward>)
output :  tensor([[182388.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(95085352., grad_fn=<MseLossBackward>)
output :  tensor([[152925.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(9452550., grad_fn=<MseLossBackward>)
output :  tensor([[198017.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(13696.3135, grad_fn=<MseLossBackward>)
output :  tensor([[206974.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(9.0155e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137237.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(56183.8125, grad_fn=<MseLossBackward>)
output :  tensor([[155496.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(246264.0625, grad_fn=<MseLossBackward>)
output :  tensor([[131892.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(16874894., grad_fn=<MseLossBackward>)
output :  tensor([[202635.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4879e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151790.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4882028.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133239.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5793e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146301.]], grad_fn=<AddmmBackward>)
loss:  tensor(1962801., grad_fn=<MseLossBackward>)
output :  tensor([[204300.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(59287112., grad_fn=<MseLossBackward>)
output :  tensor([[98842.1484]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8366e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164228.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(10704144., grad_fn=<MseLossBackward>)
output :  tensor([[126965.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(1070659., grad_fn=<MseLossBackward>)
output :  tensor([[146600.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(159363.1406, grad_fn=<MseLossBackward>)
output :  tensor([[102536.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6123e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138617.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1249819.2500, grad_fn=<MseLossBackward>)
output :  tensor([[234083.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3671295.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145287.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(82782.0781, grad_fn=<MseLossBackward>)
output :  tensor([[139065.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2450643.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163223.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2407e+09, grad_fn=<MseLossBackward>)
output :  tensor([[271336.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(44403064., grad_fn=<MseLossBackward>)
output :  tensor([[178512.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(12338095., grad_fn=<MseLossBackward>)
output :  tensor([[103481.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(497388.5938, grad_fn=<MseLossBackward>)
output :  tensor([[202798.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5804e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161063.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4256033.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165191.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5044e+10, grad_fn=<MseLossBackward>)
output :  tensor([[98129.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(28971.7637, grad_fn=<MseLossBackward>)
output :  tensor([[122777.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(675851., grad_fn=<MseLossBackward>)
output :  tensor([[154211.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3198173.2500, grad_fn=<MseLossBackward>)
output :  tensor([[142631.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6926848.5000, grad_fn=<MseLossBackward>)
output :  tensor([[198824.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1382939.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143870.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3498653.2500, grad_fn=<MseLossBackward>)
output :  tensor([[264584.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5311152.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126542.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1251e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162207.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(10843746., grad_fn=<MseLossBackward>)
output :  tensor([[187376.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1262638.5000, grad_fn=<MseLossBackward>)
output :  tensor([[121809.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3946e+08, grad_fn=<MseLossBackward>)
output :  tensor([[250609.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(371776., grad_fn=<MseLossBackward>)
output :  tensor([[161342.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5830e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243554.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3223988.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143435.]], grad_fn=<AddmmBackward>)
loss:  tensor(319225., grad_fn=<MseLossBackward>)
output :  tensor([[207895.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4430564.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177570.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(26736332., grad_fn=<MseLossBackward>)
output :  tensor([[152947.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1107164.2500, grad_fn=<MseLossBackward>)
output :  tensor([[116543.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(2120959.7500, grad_fn=<MseLossBackward>)
output :  tensor([[241465.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0816e+09, grad_fn=<MseLossBackward>)
output :  tensor([[235657.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(18861242., grad_fn=<MseLossBackward>)
output :  tensor([[152560.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(603680.4375, grad_fn=<MseLossBackward>)
output :  tensor([[252902.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3990693., grad_fn=<MseLossBackward>)
output :  tensor([[122062.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(57124544., grad_fn=<MseLossBackward>)
output :  tensor([[174275.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2973361.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158906.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1195810.6250, grad_fn=<MseLossBackward>)
output :  tensor([[128662.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(5461751.5000, grad_fn=<MseLossBackward>)
output :  tensor([[191980.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9038e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167563.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(12696082., grad_fn=<MseLossBackward>)
output :  tensor([[164111.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1234633.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158320.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(102780.3516, grad_fn=<MseLossBackward>)
output :  tensor([[152888.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(8928611., grad_fn=<MseLossBackward>)
output :  tensor([[169683.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6220e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157722.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5188145., grad_fn=<MseLossBackward>)
output :  tensor([[379565.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(19398794., grad_fn=<MseLossBackward>)
output :  tensor([[135101.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(65641140., grad_fn=<MseLossBackward>)
output :  tensor([[131219.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0903e+09, grad_fn=<MseLossBackward>)
output :  tensor([[275739.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(29962966., grad_fn=<MseLossBackward>)
output :  tensor([[165162.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(10001802., grad_fn=<MseLossBackward>)
output :  tensor([[129888.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(88150824., grad_fn=<MseLossBackward>)
output :  tensor([[227851.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(17213164., grad_fn=<MseLossBackward>)
output :  tensor([[181489.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(978522.8125, grad_fn=<MseLossBackward>)
output :  tensor([[153833.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3360404.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145298.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(88850.5703, grad_fn=<MseLossBackward>)
output :  tensor([[153719.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8288e+08, grad_fn=<MseLossBackward>)
output :  tensor([[104069.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(16560258., grad_fn=<MseLossBackward>)
output :  tensor([[73327.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7763e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164273.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(527847.6875, grad_fn=<MseLossBackward>)
output :  tensor([[190484.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4074e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157834.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(27478.2422, grad_fn=<MseLossBackward>)
output :  tensor([[163841.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(40214624., grad_fn=<MseLossBackward>)
output :  tensor([[137425.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(623.4385, grad_fn=<MseLossBackward>)
output :  tensor([[210605.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(21670188., grad_fn=<MseLossBackward>)
output :  tensor([[141005.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(9035566., grad_fn=<MseLossBackward>)
output :  tensor([[183347.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6041e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145587.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(170298.0781, grad_fn=<MseLossBackward>)
output :  tensor([[110398.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5067e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93292.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(500998.5312, grad_fn=<MseLossBackward>)
output :  tensor([[175624.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(390332.0938, grad_fn=<MseLossBackward>)
output :  tensor([[256438.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(15691873., grad_fn=<MseLossBackward>)
output :  tensor([[142853.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1831074.1250, grad_fn=<MseLossBackward>)
output :  tensor([[159989.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(8962.7637, grad_fn=<MseLossBackward>)
output :  tensor([[133921.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2021328.6250, grad_fn=<MseLossBackward>)
output :  tensor([[150056.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(309866.1875, grad_fn=<MseLossBackward>)
output :  tensor([[173709.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(33748292., grad_fn=<MseLossBackward>)
output :  tensor([[125506.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2229889., grad_fn=<MseLossBackward>)
output :  tensor([[169361.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.9347e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156487.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(262912.5625, grad_fn=<MseLossBackward>)
output :  tensor([[120212.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(13781322., grad_fn=<MseLossBackward>)
output :  tensor([[161605.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0971e+09, grad_fn=<MseLossBackward>)
output :  tensor([[55611.3477]], grad_fn=<AddmmBackward>)
loss:  tensor(13041832., grad_fn=<MseLossBackward>)
output :  tensor([[234148.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1390e+09, grad_fn=<MseLossBackward>)
output :  tensor([[201049.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2416.3369, grad_fn=<MseLossBackward>)
output :  tensor([[183550.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2102182.7500, grad_fn=<MseLossBackward>)
output :  tensor([[104803.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1431761.8750, grad_fn=<MseLossBackward>)
output :  tensor([[88850.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3423367.2500, grad_fn=<MseLossBackward>)
output :  tensor([[138737.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1594143., grad_fn=<MseLossBackward>)
output :  tensor([[222630.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(5.0935e+09, grad_fn=<MseLossBackward>)
output :  tensor([[206349.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1324693.1250, grad_fn=<MseLossBackward>)
output :  tensor([[163851.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1318298.6250, grad_fn=<MseLossBackward>)
output :  tensor([[174274.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2312e+09, grad_fn=<MseLossBackward>)
output :  tensor([[189121.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(771405.3750, grad_fn=<MseLossBackward>)
output :  tensor([[90219.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(10367243., grad_fn=<MseLossBackward>)
output :  tensor([[142249.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5062008., grad_fn=<MseLossBackward>)
output :  tensor([[114259.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(14132254., grad_fn=<MseLossBackward>)
output :  tensor([[147441.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3182e+08, grad_fn=<MseLossBackward>)
output :  tensor([[172993.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7634e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194220.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1620e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177676.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5398507., grad_fn=<MseLossBackward>)
output :  tensor([[97859.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(1849196.2500, grad_fn=<MseLossBackward>)
output :  tensor([[118071.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(326996.3438, grad_fn=<MseLossBackward>)
output :  tensor([[160781.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3912e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198575.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2029155.7500, grad_fn=<MseLossBackward>)
output :  tensor([[140953.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(9278878., grad_fn=<MseLossBackward>)
train_loss: [2.5477281e+09]
epoch_result tensor([0.])
output :  tensor([[161796.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(10867530., grad_fn=<MseLossBackward>)
output :  tensor([[118709.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(10826670., grad_fn=<MseLossBackward>)
output :  tensor([[192364.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3373593.2500, grad_fn=<MseLossBackward>)
output :  tensor([[177435.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(189782.7500, grad_fn=<MseLossBackward>)
output :  tensor([[151071.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2513e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133701.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(32506212., grad_fn=<MseLossBackward>)
output :  tensor([[140955.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1999.7666, grad_fn=<MseLossBackward>)
output :  tensor([[122071.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9431905., grad_fn=<MseLossBackward>)
output :  tensor([[63063.1523]], grad_fn=<AddmmBackward>)
loss:  tensor(20822360., grad_fn=<MseLossBackward>)
output :  tensor([[165375.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(390273.5312, grad_fn=<MseLossBackward>)
output :  tensor([[147413.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(54963688., grad_fn=<MseLossBackward>)
output :  tensor([[224037.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(927158.3750, grad_fn=<MseLossBackward>)
output :  tensor([[169876.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(767923.6250, grad_fn=<MseLossBackward>)
output :  tensor([[251501.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3244557.7500, grad_fn=<MseLossBackward>)
output :  tensor([[55516.3477]], grad_fn=<AddmmBackward>)
loss:  tensor(266614.9062, grad_fn=<MseLossBackward>)
output :  tensor([[160311.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5000e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176080.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1167210.1250, grad_fn=<MseLossBackward>)
output :  tensor([[159732.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(10448955., grad_fn=<MseLossBackward>)
output :  tensor([[276096.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1202038.1250, grad_fn=<MseLossBackward>)
output :  tensor([[194920.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4322696., grad_fn=<MseLossBackward>)
output :  tensor([[138184.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5249e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194808.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(863825., grad_fn=<MseLossBackward>)
output :  tensor([[179904.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0246e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151291.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(84926.7109, grad_fn=<MseLossBackward>)
output :  tensor([[173098.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(9601767., grad_fn=<MseLossBackward>)
output :  tensor([[86719.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(1741843.1250, grad_fn=<MseLossBackward>)
output :  tensor([[171809.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4586e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185603.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(364117.9688, grad_fn=<MseLossBackward>)
output :  tensor([[209203.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1433e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108233.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(3119446., grad_fn=<MseLossBackward>)
output :  tensor([[171867.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(753234.1250, grad_fn=<MseLossBackward>)
output :  tensor([[137527.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1054761.1250, grad_fn=<MseLossBackward>)
output :  tensor([[132029.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(9179006., grad_fn=<MseLossBackward>)
output :  tensor([[120329.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(687720.3750, grad_fn=<MseLossBackward>)
output :  tensor([[144421.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5193e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168533.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1452e+10, grad_fn=<MseLossBackward>)
output :  tensor([[151916.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4911764., grad_fn=<MseLossBackward>)
output :  tensor([[181247.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1557387., grad_fn=<MseLossBackward>)
output :  tensor([[145254.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(18099840., grad_fn=<MseLossBackward>)
output :  tensor([[105555.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4198e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135689.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2902e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135430.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(185034.4062, grad_fn=<MseLossBackward>)
output :  tensor([[127601.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(362319.3438, grad_fn=<MseLossBackward>)
output :  tensor([[223548.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2105763.7500, grad_fn=<MseLossBackward>)
output :  tensor([[132645.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(156370.8125, grad_fn=<MseLossBackward>)
output :  tensor([[147946.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1110520.7500, grad_fn=<MseLossBackward>)
output :  tensor([[111430.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(324445.9375, grad_fn=<MseLossBackward>)
output :  tensor([[158065.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3743862.2500, grad_fn=<MseLossBackward>)
output :  tensor([[144281.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5724e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193882.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3542100.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136371.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3690781.2500, grad_fn=<MseLossBackward>)
output :  tensor([[99958.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0084e+08, grad_fn=<MseLossBackward>)
output :  tensor([[232330.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2786343.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168644.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0111e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155910.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(9542404., grad_fn=<MseLossBackward>)
output :  tensor([[204035.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8380e+10, grad_fn=<MseLossBackward>)
output :  tensor([[250607.]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0690e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142048.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2107850.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132923.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1159558.7500, grad_fn=<MseLossBackward>)
output :  tensor([[157942.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(8660053., grad_fn=<MseLossBackward>)
output :  tensor([[135397.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(29127778., grad_fn=<MseLossBackward>)
output :  tensor([[178922.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5735e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182524.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2481314., grad_fn=<MseLossBackward>)
output :  tensor([[164477.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(8862901., grad_fn=<MseLossBackward>)
output :  tensor([[145177.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(4742050.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141968.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(282841.1562, grad_fn=<MseLossBackward>)
output :  tensor([[143091.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3640523.7500, grad_fn=<MseLossBackward>)
output :  tensor([[174228.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2847e+09, grad_fn=<MseLossBackward>)
output :  tensor([[193955.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3103e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136623.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(15352.7588, grad_fn=<MseLossBackward>)
output :  tensor([[171404.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(245055.9375, grad_fn=<MseLossBackward>)
output :  tensor([[177935.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(9393650., grad_fn=<MseLossBackward>)
output :  tensor([[118833.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(14695842., grad_fn=<MseLossBackward>)
output :  tensor([[223062.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4253068.5000, grad_fn=<MseLossBackward>)
output :  tensor([[181924.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2483086.5000, grad_fn=<MseLossBackward>)
output :  tensor([[127538.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(4154909., grad_fn=<MseLossBackward>)
output :  tensor([[195111.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1927368.2500, grad_fn=<MseLossBackward>)
output :  tensor([[172582.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5369647.5000, grad_fn=<MseLossBackward>)
output :  tensor([[210650.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0835e+10, grad_fn=<MseLossBackward>)
output :  tensor([[211365.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(133304.8594, grad_fn=<MseLossBackward>)
output :  tensor([[162936.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0199e+09, grad_fn=<MseLossBackward>)
output :  tensor([[190752.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(14040243., grad_fn=<MseLossBackward>)
output :  tensor([[113636.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(404694.7812, grad_fn=<MseLossBackward>)
output :  tensor([[114497.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(3991972.7500, grad_fn=<MseLossBackward>)
output :  tensor([[110637.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1855639.8750, grad_fn=<MseLossBackward>)
output :  tensor([[147234.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(188613.7812, grad_fn=<MseLossBackward>)
output :  tensor([[160930.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3020e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179584.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(172315.7969, grad_fn=<MseLossBackward>)
output :  tensor([[129194.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2871965.7500, grad_fn=<MseLossBackward>)
output :  tensor([[143579.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2017154.5000, grad_fn=<MseLossBackward>)
output :  tensor([[184129.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4236e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118704.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(3255402.7500, grad_fn=<MseLossBackward>)
output :  tensor([[199785.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7760229., grad_fn=<MseLossBackward>)
output :  tensor([[145532.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(283473.0625, grad_fn=<MseLossBackward>)
output :  tensor([[214955.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4223217.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128750.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(7564992.5000, grad_fn=<MseLossBackward>)
output :  tensor([[247619.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(502060.8125, grad_fn=<MseLossBackward>)
output :  tensor([[239610.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0602e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146157.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1779e+08, grad_fn=<MseLossBackward>)
output :  tensor([[84549.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5458e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196604.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1302e+09, grad_fn=<MseLossBackward>)
output :  tensor([[84665.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(13434745., grad_fn=<MseLossBackward>)
output :  tensor([[139438.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(3788.0178, grad_fn=<MseLossBackward>)
output :  tensor([[75280.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(48067.1367, grad_fn=<MseLossBackward>)
output :  tensor([[144369.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2006826.3750, grad_fn=<MseLossBackward>)
output :  tensor([[176023.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(559.6182, grad_fn=<MseLossBackward>)
output :  tensor([[152244.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1576711.8750, grad_fn=<MseLossBackward>)
output :  tensor([[110892.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(12198157., grad_fn=<MseLossBackward>)
output :  tensor([[204534.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2369e+10, grad_fn=<MseLossBackward>)
output :  tensor([[128349.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(22535.1699, grad_fn=<MseLossBackward>)
output :  tensor([[271193.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(77557744., grad_fn=<MseLossBackward>)
output :  tensor([[307165.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8034036., grad_fn=<MseLossBackward>)
output :  tensor([[106922.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(333948.5312, grad_fn=<MseLossBackward>)
output :  tensor([[169767.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7465788., grad_fn=<MseLossBackward>)
output :  tensor([[133314.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4083e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135294.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(13731425., grad_fn=<MseLossBackward>)
output :  tensor([[129855.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(155802.8906, grad_fn=<MseLossBackward>)
output :  tensor([[127975.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(8853228., grad_fn=<MseLossBackward>)
output :  tensor([[135197.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6034e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226662.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8548e+10, grad_fn=<MseLossBackward>)
output :  tensor([[192678.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1999e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144522.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(387895.4062, grad_fn=<MseLossBackward>)
output :  tensor([[127251.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(61604.7930, grad_fn=<MseLossBackward>)
output :  tensor([[109825.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2028933.1250, grad_fn=<MseLossBackward>)
output :  tensor([[261704.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1760e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135115.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(13293.3691, grad_fn=<MseLossBackward>)
output :  tensor([[206378.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(11413946., grad_fn=<MseLossBackward>)
output :  tensor([[107508.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(6806677., grad_fn=<MseLossBackward>)
output :  tensor([[140639.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(475776.6250, grad_fn=<MseLossBackward>)
output :  tensor([[209611.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2166e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178872.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1056141.6250, grad_fn=<MseLossBackward>)
output :  tensor([[186612.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2601013., grad_fn=<MseLossBackward>)
output :  tensor([[162132.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1570e+10, grad_fn=<MseLossBackward>)
output :  tensor([[304129.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5299e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196246.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2732615.7500, grad_fn=<MseLossBackward>)
output :  tensor([[257899.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1014e+10, grad_fn=<MseLossBackward>)
output :  tensor([[227904.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4512e+09, grad_fn=<MseLossBackward>)
output :  tensor([[289326.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6584e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221511.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(6192710., grad_fn=<MseLossBackward>)
output :  tensor([[221782.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8974e+10, grad_fn=<MseLossBackward>)
output :  tensor([[196489.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(260817.6875, grad_fn=<MseLossBackward>)
output :  tensor([[157894.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3489e+08, grad_fn=<MseLossBackward>)
output :  tensor([[129641.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(8171737., grad_fn=<MseLossBackward>)
output :  tensor([[137699.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4836563., grad_fn=<MseLossBackward>)
output :  tensor([[91705.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(497796.4062, grad_fn=<MseLossBackward>)
output :  tensor([[107085.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(835496., grad_fn=<MseLossBackward>)
output :  tensor([[277824.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6088e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237135.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4560827.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143786.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1472999.3750, grad_fn=<MseLossBackward>)
output :  tensor([[135876.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2637274.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175115.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1911435.8750, grad_fn=<MseLossBackward>)
output :  tensor([[147821.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6610282., grad_fn=<MseLossBackward>)
output :  tensor([[166397.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8977e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167642.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(6984788.5000, grad_fn=<MseLossBackward>)
output :  tensor([[137223.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(50120.0156, grad_fn=<MseLossBackward>)
output :  tensor([[188491.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3548e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111087.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(832656.2500, grad_fn=<MseLossBackward>)
output :  tensor([[172637.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(406725.0625, grad_fn=<MseLossBackward>)
output :  tensor([[120306.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(93932.6719, grad_fn=<MseLossBackward>)
output :  tensor([[87890.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(792572.8750, grad_fn=<MseLossBackward>)
output :  tensor([[178763.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1528314., grad_fn=<MseLossBackward>)
output :  tensor([[111108.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1461378.7500, grad_fn=<MseLossBackward>)
output :  tensor([[236044.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(8733503., grad_fn=<MseLossBackward>)
output :  tensor([[242381.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(6857033., grad_fn=<MseLossBackward>)
output :  tensor([[128843.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(430582.0312, grad_fn=<MseLossBackward>)
output :  tensor([[114517.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(30895532., grad_fn=<MseLossBackward>)
output :  tensor([[289440.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1819e+10, grad_fn=<MseLossBackward>)
output :  tensor([[169429.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4288005.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124616.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(147174.1406, grad_fn=<MseLossBackward>)
output :  tensor([[144203.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8663e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203407.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1221e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140942.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3362.1877, grad_fn=<MseLossBackward>)
output :  tensor([[161179.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4118e+10, grad_fn=<MseLossBackward>)
output :  tensor([[152653.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1553879.1250, grad_fn=<MseLossBackward>)
output :  tensor([[130658.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1342520.5000, grad_fn=<MseLossBackward>)
output :  tensor([[251875.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6034e+10, grad_fn=<MseLossBackward>)
output :  tensor([[400443.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2422595., grad_fn=<MseLossBackward>)
output :  tensor([[108352.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(419215.7812, grad_fn=<MseLossBackward>)
output :  tensor([[119979.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(2188666., grad_fn=<MseLossBackward>)
output :  tensor([[159434.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(4275.9336, grad_fn=<MseLossBackward>)
output :  tensor([[128911.4766]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2943e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162165.]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5802e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172633.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9229e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107034.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(11793107., grad_fn=<MseLossBackward>)
output :  tensor([[142336.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1785814.6250, grad_fn=<MseLossBackward>)
output :  tensor([[364450.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8084781.5000, grad_fn=<MseLossBackward>)
output :  tensor([[211193.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8324e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180360.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(23620360., grad_fn=<MseLossBackward>)
output :  tensor([[202601.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(89111.5781, grad_fn=<MseLossBackward>)
output :  tensor([[141132.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4548689., grad_fn=<MseLossBackward>)
output :  tensor([[197841.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(11164265., grad_fn=<MseLossBackward>)
output :  tensor([[133848.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9426e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180397.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(363081.5625, grad_fn=<MseLossBackward>)
output :  tensor([[241241.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(574966.7500, grad_fn=<MseLossBackward>)
output :  tensor([[172401.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2556501.2500, grad_fn=<MseLossBackward>)
output :  tensor([[107476.]], grad_fn=<AddmmBackward>)
loss:  tensor(274576., grad_fn=<MseLossBackward>)
output :  tensor([[266207.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2711271., grad_fn=<MseLossBackward>)
output :  tensor([[251908.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3642014.5000, grad_fn=<MseLossBackward>)
output :  tensor([[122939.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3620.6545, grad_fn=<MseLossBackward>)
output :  tensor([[216650.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4046e+09, grad_fn=<MseLossBackward>)
output :  tensor([[306717.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4532e+08, grad_fn=<MseLossBackward>)
output :  tensor([[209308.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5328883.5000, grad_fn=<MseLossBackward>)
output :  tensor([[216089.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5354e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158179.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(78094.0469, grad_fn=<MseLossBackward>)
output :  tensor([[171405.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2002269.2500, grad_fn=<MseLossBackward>)
output :  tensor([[159847.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(8499958., grad_fn=<MseLossBackward>)
output :  tensor([[169421.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(334734.5625, grad_fn=<MseLossBackward>)
output :  tensor([[240307.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6686e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226449.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(9041203., grad_fn=<MseLossBackward>)
output :  tensor([[161043.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9722e+08, grad_fn=<MseLossBackward>)
output :  tensor([[120538.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6060982.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177249.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(62375.0625, grad_fn=<MseLossBackward>)
output :  tensor([[182460.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0123e+09, grad_fn=<MseLossBackward>)
output :  tensor([[210517.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3893e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134660.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(52412.3789, grad_fn=<MseLossBackward>)
output :  tensor([[148387.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1759e+08, grad_fn=<MseLossBackward>)
output :  tensor([[280695.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(13656489., grad_fn=<MseLossBackward>)
output :  tensor([[88119.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(9729964., grad_fn=<MseLossBackward>)
output :  tensor([[234166.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5445295., grad_fn=<MseLossBackward>)
output :  tensor([[264825.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0119e+11, grad_fn=<MseLossBackward>)
output :  tensor([[172420.]], grad_fn=<AddmmBackward>)
loss:  tensor(5856400., grad_fn=<MseLossBackward>)
output :  tensor([[196513.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4812e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156460.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2134292.7500, grad_fn=<MseLossBackward>)
output :  tensor([[206721.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0042e+09, grad_fn=<MseLossBackward>)
output :  tensor([[132115.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(9706535., grad_fn=<MseLossBackward>)
output :  tensor([[152593.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(57665512., grad_fn=<MseLossBackward>)
output :  tensor([[172306.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(8.8842e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186091.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(58397.7422, grad_fn=<MseLossBackward>)
output :  tensor([[128707.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(7328526., grad_fn=<MseLossBackward>)
output :  tensor([[139746.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(10540574., grad_fn=<MseLossBackward>)
output :  tensor([[172859.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(19661.2969, grad_fn=<MseLossBackward>)
output :  tensor([[202836.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2244e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237612.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(29029366., grad_fn=<MseLossBackward>)
output :  tensor([[151665.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(11116390., grad_fn=<MseLossBackward>)
output :  tensor([[199264.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(10657470., grad_fn=<MseLossBackward>)
output :  tensor([[159185.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3061e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179379.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(14430.0156, grad_fn=<MseLossBackward>)
output :  tensor([[183159.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(10621998., grad_fn=<MseLossBackward>)
output :  tensor([[97479.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(230055.1250, grad_fn=<MseLossBackward>)
output :  tensor([[171999.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1664e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135929.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(864464.1250, grad_fn=<MseLossBackward>)
output :  tensor([[119102.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(16828456., grad_fn=<MseLossBackward>)
output :  tensor([[170327.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(13487371., grad_fn=<MseLossBackward>)
output :  tensor([[85354.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(125559.4922, grad_fn=<MseLossBackward>)
output :  tensor([[290942.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(888424.0625, grad_fn=<MseLossBackward>)
output :  tensor([[169956.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(24567666., grad_fn=<MseLossBackward>)
output :  tensor([[190932.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0231e+10, grad_fn=<MseLossBackward>)
output :  tensor([[247339.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5984e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149527.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2167428., grad_fn=<MseLossBackward>)
output :  tensor([[120679.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(11025409., grad_fn=<MseLossBackward>)
output :  tensor([[124106.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(17690568., grad_fn=<MseLossBackward>)
output :  tensor([[140380.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4419e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173842.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(24845.6406, grad_fn=<MseLossBackward>)
output :  tensor([[106675.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8443e+08, grad_fn=<MseLossBackward>)
output :  tensor([[213392.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0943e+10, grad_fn=<MseLossBackward>)
output :  tensor([[249168.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(58805892., grad_fn=<MseLossBackward>)
output :  tensor([[252914.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0243e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221157.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1836e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196029.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4273e+10, grad_fn=<MseLossBackward>)
output :  tensor([[187448.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2618.5608, grad_fn=<MseLossBackward>)
output :  tensor([[205956.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7923e+10, grad_fn=<MseLossBackward>)
output :  tensor([[189555.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1446e+10, grad_fn=<MseLossBackward>)
output :  tensor([[176637.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4418995., grad_fn=<MseLossBackward>)
output :  tensor([[149037.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(8778350., grad_fn=<MseLossBackward>)
output :  tensor([[330659.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(40202336., grad_fn=<MseLossBackward>)
output :  tensor([[209936.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4257387.5000, grad_fn=<MseLossBackward>)
output :  tensor([[156913.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(9526675., grad_fn=<MseLossBackward>)
output :  tensor([[187531.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9126e+09, grad_fn=<MseLossBackward>)
output :  tensor([[103824.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(1380863.6250, grad_fn=<MseLossBackward>)
output :  tensor([[279097.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6122e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170443.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(11945016., grad_fn=<MseLossBackward>)
output :  tensor([[210673.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7990250.5000, grad_fn=<MseLossBackward>)
output :  tensor([[216568.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(19635284., grad_fn=<MseLossBackward>)
output :  tensor([[179210.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(102.8323, grad_fn=<MseLossBackward>)
output :  tensor([[198862.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(8628355., grad_fn=<MseLossBackward>)
output :  tensor([[157757.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(7602600., grad_fn=<MseLossBackward>)
output :  tensor([[145547.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0746e+09, grad_fn=<MseLossBackward>)
output :  tensor([[120647.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4612024.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139974.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(634.4102, grad_fn=<MseLossBackward>)
output :  tensor([[146232.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(7658278., grad_fn=<MseLossBackward>)
output :  tensor([[202934.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5641e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161767.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(5141485.5000, grad_fn=<MseLossBackward>)
output :  tensor([[101642.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4589971.5000, grad_fn=<MseLossBackward>)
output :  tensor([[224596.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3727e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182489.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8864e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176084.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(160475.3594, grad_fn=<MseLossBackward>)
output :  tensor([[85213.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(10329495., grad_fn=<MseLossBackward>)
output :  tensor([[131487.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8925530., grad_fn=<MseLossBackward>)
output :  tensor([[216924.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8551695., grad_fn=<MseLossBackward>)
output :  tensor([[143327.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(451857.0312, grad_fn=<MseLossBackward>)
output :  tensor([[131101.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1213440., grad_fn=<MseLossBackward>)
output :  tensor([[140657.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(3774641.7500, grad_fn=<MseLossBackward>)
output :  tensor([[177111.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5691e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143827.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(29874.9609, grad_fn=<MseLossBackward>)
output :  tensor([[160824.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(679439.5625, grad_fn=<MseLossBackward>)
output :  tensor([[213829.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1369924., grad_fn=<MseLossBackward>)
output :  tensor([[135309.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.1866e+08, grad_fn=<MseLossBackward>)
output :  tensor([[256149.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1321925., grad_fn=<MseLossBackward>)
output :  tensor([[156046.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(11923641., grad_fn=<MseLossBackward>)
output :  tensor([[127270.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(1511766.2500, grad_fn=<MseLossBackward>)
output :  tensor([[95539.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(291372.2188, grad_fn=<MseLossBackward>)
output :  tensor([[151368.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4714e+09, grad_fn=<MseLossBackward>)
output :  tensor([[177187.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(7359351.5000, grad_fn=<MseLossBackward>)
output :  tensor([[123345.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(8095092., grad_fn=<MseLossBackward>)
output :  tensor([[195111.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1451e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144130.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1771e+09, grad_fn=<MseLossBackward>)
output :  tensor([[149713.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(34741.4648, grad_fn=<MseLossBackward>)
output :  tensor([[189641.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3577003.7500, grad_fn=<MseLossBackward>)
output :  tensor([[256287.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3535e+09, grad_fn=<MseLossBackward>)
output :  tensor([[89503.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3987260.2500, grad_fn=<MseLossBackward>)
output :  tensor([[240782.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(612232.8750, grad_fn=<MseLossBackward>)
output :  tensor([[131482.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(8896238., grad_fn=<MseLossBackward>)
output :  tensor([[163943.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0395e+10, grad_fn=<MseLossBackward>)
output :  tensor([[113655.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8648e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179102.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(9623761., grad_fn=<MseLossBackward>)
output :  tensor([[162828.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4888e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153588.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3309e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239519.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(270107.5938, grad_fn=<MseLossBackward>)
output :  tensor([[226903.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6699e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127009.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(87.8906, grad_fn=<MseLossBackward>)
output :  tensor([[129642.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(13265757., grad_fn=<MseLossBackward>)
output :  tensor([[226717.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(79806.2500, grad_fn=<MseLossBackward>)
output :  tensor([[229152.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(23499468., grad_fn=<MseLossBackward>)
output :  tensor([[227280.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(337125.3750, grad_fn=<MseLossBackward>)
output :  tensor([[147067.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(869585.3750, grad_fn=<MseLossBackward>)
output :  tensor([[203439.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(43040980., grad_fn=<MseLossBackward>)
output :  tensor([[128714.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(75943872., grad_fn=<MseLossBackward>)
output :  tensor([[135488.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(8930945., grad_fn=<MseLossBackward>)
output :  tensor([[311639.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(11291910., grad_fn=<MseLossBackward>)
output :  tensor([[141285.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(81447.8125, grad_fn=<MseLossBackward>)
output :  tensor([[122448.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0745e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109952.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(205039.1562, grad_fn=<MseLossBackward>)
output :  tensor([[156047.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7069e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182097.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(8.5798e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173695.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(483676.7812, grad_fn=<MseLossBackward>)
output :  tensor([[196442.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(20768670., grad_fn=<MseLossBackward>)
output :  tensor([[93347.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(44262304., grad_fn=<MseLossBackward>)
output :  tensor([[177978.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1042728.1875, grad_fn=<MseLossBackward>)
output :  tensor([[170673.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(7693255.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138206.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(629196., grad_fn=<MseLossBackward>)
output :  tensor([[265481.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7645e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141432.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1846e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174175.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1381837., grad_fn=<MseLossBackward>)
output :  tensor([[139664.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(112654.6328, grad_fn=<MseLossBackward>)
output :  tensor([[203729.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(10431487., grad_fn=<MseLossBackward>)
output :  tensor([[170066.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4445.1387, grad_fn=<MseLossBackward>)
output :  tensor([[241144.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(8152095.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134104.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(156519.1406, grad_fn=<MseLossBackward>)
output :  tensor([[150243.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(798872.8750, grad_fn=<MseLossBackward>)
output :  tensor([[214196.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(646215., grad_fn=<MseLossBackward>)
output :  tensor([[167462.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6065368.5000, grad_fn=<MseLossBackward>)
output :  tensor([[188446.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(306275.7812, grad_fn=<MseLossBackward>)
output :  tensor([[132624.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9569e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128278.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(519874.8125, grad_fn=<MseLossBackward>)
output :  tensor([[139069.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(865016.2500, grad_fn=<MseLossBackward>)
output :  tensor([[206361.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9865e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165905.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5913e+09, grad_fn=<MseLossBackward>)
output :  tensor([[74453.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0892e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93671.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(84121568., grad_fn=<MseLossBackward>)
output :  tensor([[251873.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(2016178.1250, grad_fn=<MseLossBackward>)
output :  tensor([[202709.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0589e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114265.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(539547.6250, grad_fn=<MseLossBackward>)
output :  tensor([[155691.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0118e+09, grad_fn=<MseLossBackward>)
output :  tensor([[209260.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1533e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182484.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6589e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156998.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3995438.7500, grad_fn=<MseLossBackward>)
output :  tensor([[170806.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(650971.6250, grad_fn=<MseLossBackward>)
output :  tensor([[116257.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(1580893.6250, grad_fn=<MseLossBackward>)
output :  tensor([[159670.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(21812548., grad_fn=<MseLossBackward>)
output :  tensor([[192640.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0332e+08, grad_fn=<MseLossBackward>)
output :  tensor([[220323.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(677740.5625, grad_fn=<MseLossBackward>)
output :  tensor([[247716.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4729e+11, grad_fn=<MseLossBackward>)
output :  tensor([[149038.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4155546., grad_fn=<MseLossBackward>)
output :  tensor([[112537.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(16461278., grad_fn=<MseLossBackward>)
output :  tensor([[168879.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6952e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157347.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(46887188., grad_fn=<MseLossBackward>)
output :  tensor([[236086.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(834567.8750, grad_fn=<MseLossBackward>)
output :  tensor([[115462.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(213494.5312, grad_fn=<MseLossBackward>)
output :  tensor([[184402.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(2256896., grad_fn=<MseLossBackward>)
output :  tensor([[188820.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4495659., grad_fn=<MseLossBackward>)
output :  tensor([[163767.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4409e+10, grad_fn=<MseLossBackward>)
output :  tensor([[94527.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8300e+08, grad_fn=<MseLossBackward>)
output :  tensor([[238424.]], grad_fn=<AddmmBackward>)
loss:  tensor(331776., grad_fn=<MseLossBackward>)
output :  tensor([[175942.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(3320.6406, grad_fn=<MseLossBackward>)
output :  tensor([[138579.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2018175.3750, grad_fn=<MseLossBackward>)
output :  tensor([[235548.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(300817.9688, grad_fn=<MseLossBackward>)
output :  tensor([[161177.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3320766., grad_fn=<MseLossBackward>)
output :  tensor([[205467.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4288e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134321.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(460786.4062, grad_fn=<MseLossBackward>)
output :  tensor([[186892.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1965e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136794.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(631279.9375, grad_fn=<MseLossBackward>)
output :  tensor([[229085.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(47809664., grad_fn=<MseLossBackward>)
output :  tensor([[230046.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9815e+08, grad_fn=<MseLossBackward>)
output :  tensor([[89034.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(931390.8750, grad_fn=<MseLossBackward>)
output :  tensor([[160028.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(353746.1562, grad_fn=<MseLossBackward>)
output :  tensor([[247619.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5193e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147549.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6497879., grad_fn=<MseLossBackward>)
output :  tensor([[106647.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5719e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164233.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(71138.8906, grad_fn=<MseLossBackward>)
output :  tensor([[143727.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(74145.5859, grad_fn=<MseLossBackward>)
output :  tensor([[128584.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(147780.1719, grad_fn=<MseLossBackward>)
output :  tensor([[189714.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8004e+09, grad_fn=<MseLossBackward>)
output :  tensor([[122179.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(102450.0078, grad_fn=<MseLossBackward>)
output :  tensor([[151142.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(735815.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169814.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3746886., grad_fn=<MseLossBackward>)
output :  tensor([[148690.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5333718., grad_fn=<MseLossBackward>)
output :  tensor([[159531.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(11348898., grad_fn=<MseLossBackward>)
output :  tensor([[135657.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1064e+08, grad_fn=<MseLossBackward>)
output :  tensor([[131941.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3382.1494, grad_fn=<MseLossBackward>)
output :  tensor([[153748.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1752e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148305.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(17247798., grad_fn=<MseLossBackward>)
output :  tensor([[164970.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(10373130., grad_fn=<MseLossBackward>)
output :  tensor([[134612.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1072e+08, grad_fn=<MseLossBackward>)
output :  tensor([[151439.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6967207.5000, grad_fn=<MseLossBackward>)
output :  tensor([[185183.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(7930472., grad_fn=<MseLossBackward>)
output :  tensor([[169105.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(11133.5469, grad_fn=<MseLossBackward>)
output :  tensor([[180091.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(8441.0156, grad_fn=<MseLossBackward>)
output :  tensor([[220942.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(888541.8750, grad_fn=<MseLossBackward>)
output :  tensor([[110470.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(6608072.5000, grad_fn=<MseLossBackward>)
output :  tensor([[134148.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(85533016., grad_fn=<MseLossBackward>)
output :  tensor([[285894.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(11216.1338, grad_fn=<MseLossBackward>)
output :  tensor([[116865.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(749063.1875, grad_fn=<MseLossBackward>)
output :  tensor([[177882.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7739e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185540.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(292495.0625, grad_fn=<MseLossBackward>)
output :  tensor([[179495.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(36057396., grad_fn=<MseLossBackward>)
output :  tensor([[250074.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2126e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222845.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(714738.1250, grad_fn=<MseLossBackward>)
output :  tensor([[120966.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2699e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171800.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5347e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124190.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(36296.2031, grad_fn=<MseLossBackward>)
output :  tensor([[185571.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4114e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150726.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5168376., grad_fn=<MseLossBackward>)
output :  tensor([[153041.]], grad_fn=<AddmmBackward>)
loss:  tensor(42784680., grad_fn=<MseLossBackward>)
output :  tensor([[204304.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(3982456.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147394.]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2183e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174140.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3456520., grad_fn=<MseLossBackward>)
output :  tensor([[252713.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1751e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146865.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1286416.7500, grad_fn=<MseLossBackward>)
output :  tensor([[200478.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4780372.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155925.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(16198361., grad_fn=<MseLossBackward>)
output :  tensor([[123302.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2463e+09, grad_fn=<MseLossBackward>)
output :  tensor([[131490.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(18139480., grad_fn=<MseLossBackward>)
output :  tensor([[183381.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(382387.6250, grad_fn=<MseLossBackward>)
output :  tensor([[194540.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(20617418., grad_fn=<MseLossBackward>)
output :  tensor([[238203.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5803e+09, grad_fn=<MseLossBackward>)
output :  tensor([[254465.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6424799., grad_fn=<MseLossBackward>)
output :  tensor([[189189.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6851e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143649.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7196e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153396.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(79152720., grad_fn=<MseLossBackward>)
output :  tensor([[71473.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9057e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125964.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(81648448., grad_fn=<MseLossBackward>)
output :  tensor([[132223.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(11042744., grad_fn=<MseLossBackward>)
output :  tensor([[152723.]], grad_fn=<AddmmBackward>)
loss:  tensor(1630729., grad_fn=<MseLossBackward>)
output :  tensor([[128281.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1641961.8750, grad_fn=<MseLossBackward>)
output :  tensor([[81557.]], grad_fn=<AddmmBackward>)
loss:  tensor(25573248., grad_fn=<MseLossBackward>)
output :  tensor([[83102.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(1214972.2500, grad_fn=<MseLossBackward>)
output :  tensor([[219746.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5015e+08, grad_fn=<MseLossBackward>)
output :  tensor([[139900.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5078e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134090.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(12891241., grad_fn=<MseLossBackward>)
output :  tensor([[167543.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(295171.5000, grad_fn=<MseLossBackward>)
output :  tensor([[237469.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6098507.5000, grad_fn=<MseLossBackward>)
output :  tensor([[189614.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(6377913.5000, grad_fn=<MseLossBackward>)
output :  tensor([[156475.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(226486.7656, grad_fn=<MseLossBackward>)
output :  tensor([[196536.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1860325.5000, grad_fn=<MseLossBackward>)
output :  tensor([[209722.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4405e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137062.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3965.0635, grad_fn=<MseLossBackward>)
output :  tensor([[155290.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(84471.9766, grad_fn=<MseLossBackward>)
output :  tensor([[133500.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(6248984.5000, grad_fn=<MseLossBackward>)
output :  tensor([[203879.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.8227e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156059.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4241926.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136392.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8398e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145817.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(841806.2500, grad_fn=<MseLossBackward>)
output :  tensor([[208242.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(14118571., grad_fn=<MseLossBackward>)
output :  tensor([[99667.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1214e+08, grad_fn=<MseLossBackward>)
output :  tensor([[169860.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(5570116.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132367.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(19072872., grad_fn=<MseLossBackward>)
output :  tensor([[146857.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(20377.5625, grad_fn=<MseLossBackward>)
output :  tensor([[104424.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7675e+09, grad_fn=<MseLossBackward>)
output :  tensor([[138086.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(344403.9375, grad_fn=<MseLossBackward>)
output :  tensor([[232782.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(10353815., grad_fn=<MseLossBackward>)
output :  tensor([[145594.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(353188.7812, grad_fn=<MseLossBackward>)
output :  tensor([[140680.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(10116674., grad_fn=<MseLossBackward>)
output :  tensor([[165456.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4030e+09, grad_fn=<MseLossBackward>)
output :  tensor([[274640.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(11287500., grad_fn=<MseLossBackward>)
output :  tensor([[169421.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(31114606., grad_fn=<MseLossBackward>)
output :  tensor([[103704.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(861372.5000, grad_fn=<MseLossBackward>)
output :  tensor([[203507.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4749e+09, grad_fn=<MseLossBackward>)
output :  tensor([[154857.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(17162766., grad_fn=<MseLossBackward>)
output :  tensor([[163962.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5566e+10, grad_fn=<MseLossBackward>)
output :  tensor([[102302.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(16023946., grad_fn=<MseLossBackward>)
output :  tensor([[124400.0547]], grad_fn=<AddmmBackward>)
loss:  tensor(640087.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157008.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1017072.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143222.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(10386923., grad_fn=<MseLossBackward>)
output :  tensor([[200844.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(712520.6250, grad_fn=<MseLossBackward>)
output :  tensor([[141015.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(969178.7500, grad_fn=<MseLossBackward>)
output :  tensor([[256760.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(30459534., grad_fn=<MseLossBackward>)
output :  tensor([[127335.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1789e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162046.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(11925799., grad_fn=<MseLossBackward>)
output :  tensor([[187005.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2234557.7500, grad_fn=<MseLossBackward>)
output :  tensor([[122465.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5539e+08, grad_fn=<MseLossBackward>)
output :  tensor([[248281.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2952705.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158428.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1635e+08, grad_fn=<MseLossBackward>)
output :  tensor([[240697.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(21647792., grad_fn=<MseLossBackward>)
output :  tensor([[146124.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4515359.5000, grad_fn=<MseLossBackward>)
output :  tensor([[213378.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(11415740., grad_fn=<MseLossBackward>)
output :  tensor([[176803.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(19393426., grad_fn=<MseLossBackward>)
output :  tensor([[154316.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(100053.5938, grad_fn=<MseLossBackward>)
output :  tensor([[119702.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2900049.2500, grad_fn=<MseLossBackward>)
output :  tensor([[237190.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4899e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238467.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2347933.7500, grad_fn=<MseLossBackward>)
output :  tensor([[151050.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5226296., grad_fn=<MseLossBackward>)
output :  tensor([[255317.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(173915.0625, grad_fn=<MseLossBackward>)
output :  tensor([[121414.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(47755120., grad_fn=<MseLossBackward>)
output :  tensor([[176928.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(862257.3125, grad_fn=<MseLossBackward>)
output :  tensor([[159455.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(296072., grad_fn=<MseLossBackward>)
output :  tensor([[135578.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(20958370., grad_fn=<MseLossBackward>)
output :  tensor([[191228.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8105e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162850.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1321027., grad_fn=<MseLossBackward>)
output :  tensor([[164057.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1119033.3750, grad_fn=<MseLossBackward>)
output :  tensor([[156057.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3771667.5000, grad_fn=<MseLossBackward>)
output :  tensor([[147480.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5855265.5000, grad_fn=<MseLossBackward>)
output :  tensor([[169764.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.6318e+09, grad_fn=<MseLossBackward>)
output :  tensor([[156797.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(10253504., grad_fn=<MseLossBackward>)
output :  tensor([[379734.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(17942902., grad_fn=<MseLossBackward>)
output :  tensor([[124733.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5137447., grad_fn=<MseLossBackward>)
output :  tensor([[128895.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8832e+09, grad_fn=<MseLossBackward>)
output :  tensor([[277772.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(11838976., grad_fn=<MseLossBackward>)
output :  tensor([[164832.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(8022525., grad_fn=<MseLossBackward>)
output :  tensor([[129600.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(82810424., grad_fn=<MseLossBackward>)
output :  tensor([[234185.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4776137., grad_fn=<MseLossBackward>)
output :  tensor([[179991.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(258476.9219, grad_fn=<MseLossBackward>)
output :  tensor([[153191.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1418667.1250, grad_fn=<MseLossBackward>)
output :  tensor([[144278.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(519931.1250, grad_fn=<MseLossBackward>)
output :  tensor([[152029.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2889e+08, grad_fn=<MseLossBackward>)
output :  tensor([[102563.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(6572533.5000, grad_fn=<MseLossBackward>)
output :  tensor([[68533.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(72817952., grad_fn=<MseLossBackward>)
output :  tensor([[166117.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1247793.7500, grad_fn=<MseLossBackward>)
output :  tensor([[188957.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5243e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163906.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(34891172., grad_fn=<MseLossBackward>)
output :  tensor([[151338.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(37959652., grad_fn=<MseLossBackward>)
output :  tensor([[138886.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2064699.6250, grad_fn=<MseLossBackward>)
output :  tensor([[206636.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(470681.7500, grad_fn=<MseLossBackward>)
output :  tensor([[139611.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(2596378.2500, grad_fn=<MseLossBackward>)
output :  tensor([[182906.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6153e+10, grad_fn=<MseLossBackward>)
output :  tensor([[150447.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(19775948., grad_fn=<MseLossBackward>)
output :  tensor([[108208.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3549e+08, grad_fn=<MseLossBackward>)
output :  tensor([[95565.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2450007.5000, grad_fn=<MseLossBackward>)
output :  tensor([[174233.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(587306.6875, grad_fn=<MseLossBackward>)
output :  tensor([[261045.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(416629.9062, grad_fn=<MseLossBackward>)
output :  tensor([[140547.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(907792.1250, grad_fn=<MseLossBackward>)
output :  tensor([[157011.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(8316464.5000, grad_fn=<MseLossBackward>)
output :  tensor([[131806.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(481484.1875, grad_fn=<MseLossBackward>)
output :  tensor([[150074.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(329601.5625, grad_fn=<MseLossBackward>)
output :  tensor([[168467.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(322428.7812, grad_fn=<MseLossBackward>)
output :  tensor([[128323.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1752438.1250, grad_fn=<MseLossBackward>)
output :  tensor([[170315.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4085e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158649.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2721005., grad_fn=<MseLossBackward>)
output :  tensor([[118079.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2494820.2500, grad_fn=<MseLossBackward>)
output :  tensor([[159457.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4084e+09, grad_fn=<MseLossBackward>)
output :  tensor([[50926.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1152872., grad_fn=<MseLossBackward>)
output :  tensor([[232097.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4645e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196931.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(16551548., grad_fn=<MseLossBackward>)
output :  tensor([[187679.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7181395., grad_fn=<MseLossBackward>)
output :  tensor([[108047.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(4191520.5000, grad_fn=<MseLossBackward>)
output :  tensor([[87544.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(296046.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139696.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(92169.1641, grad_fn=<MseLossBackward>)
output :  tensor([[224339.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8525e+09, grad_fn=<MseLossBackward>)
output :  tensor([[206563.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(876417.7500, grad_fn=<MseLossBackward>)
output :  tensor([[168810.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(14520506., grad_fn=<MseLossBackward>)
output :  tensor([[174452.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(8.1989e+09, grad_fn=<MseLossBackward>)
output :  tensor([[188095.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3628489.2500, grad_fn=<MseLossBackward>)
output :  tensor([[87568.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(322766., grad_fn=<MseLossBackward>)
output :  tensor([[140508.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(259065.0938, grad_fn=<MseLossBackward>)
output :  tensor([[109755.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(554070.8750, grad_fn=<MseLossBackward>)
output :  tensor([[147042.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2282e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173238.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7841e+09, grad_fn=<MseLossBackward>)
output :  tensor([[196376.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(74365288., grad_fn=<MseLossBackward>)
output :  tensor([[177352.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(7008677., grad_fn=<MseLossBackward>)
output :  tensor([[98035.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(2358696., grad_fn=<MseLossBackward>)
output :  tensor([[118189.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(475442.5625, grad_fn=<MseLossBackward>)
output :  tensor([[162862.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4678e+08, grad_fn=<MseLossBackward>)
output :  tensor([[200437.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(191802.9375, grad_fn=<MseLossBackward>)
output :  tensor([[144970.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(942750., grad_fn=<MseLossBackward>)
train_loss: [2.5404964e+09]
epoch_result tensor([0.])
output :  tensor([[155045.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(11931411., grad_fn=<MseLossBackward>)
output :  tensor([[122292.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(85583.6719, grad_fn=<MseLossBackward>)
output :  tensor([[196879.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7176120., grad_fn=<MseLossBackward>)
output :  tensor([[174640.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5566208., grad_fn=<MseLossBackward>)
output :  tensor([[151129.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2201e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130288.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5235945., grad_fn=<MseLossBackward>)
output :  tensor([[142031.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(1063669.8750, grad_fn=<MseLossBackward>)
output :  tensor([[118582.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(174254.0625, grad_fn=<MseLossBackward>)
output :  tensor([[64575.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(36907144., grad_fn=<MseLossBackward>)
output :  tensor([[166944.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(892995.5000, grad_fn=<MseLossBackward>)
output :  tensor([[133143.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(47004952., grad_fn=<MseLossBackward>)
output :  tensor([[225356.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(127092.2500, grad_fn=<MseLossBackward>)
output :  tensor([[166166.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(8026420., grad_fn=<MseLossBackward>)
output :  tensor([[246248.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(11911882., grad_fn=<MseLossBackward>)
output :  tensor([[55187.9492]], grad_fn=<AddmmBackward>)
loss:  tensor(35324.9102, grad_fn=<MseLossBackward>)
output :  tensor([[160020.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4089e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167373.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(58158020., grad_fn=<MseLossBackward>)
output :  tensor([[151031.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(29908594., grad_fn=<MseLossBackward>)
output :  tensor([[275207.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(43238.0039, grad_fn=<MseLossBackward>)
output :  tensor([[198119.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1253595.1250, grad_fn=<MseLossBackward>)
output :  tensor([[139544.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4505e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193302.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(331992.0312, grad_fn=<MseLossBackward>)
output :  tensor([[180355.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9842e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151238.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(56919.5234, grad_fn=<MseLossBackward>)
output :  tensor([[170061.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3834.3186, grad_fn=<MseLossBackward>)
output :  tensor([[86608.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(1460717.7500, grad_fn=<MseLossBackward>)
output :  tensor([[171317.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4010e+09, grad_fn=<MseLossBackward>)
output :  tensor([[180784.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(17772022., grad_fn=<MseLossBackward>)
output :  tensor([[208518.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2073e+09, grad_fn=<MseLossBackward>)
output :  tensor([[110364.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(132848.8594, grad_fn=<MseLossBackward>)
output :  tensor([[169405.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(2540885.7500, grad_fn=<MseLossBackward>)
output :  tensor([[135176.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1752520.8750, grad_fn=<MseLossBackward>)
output :  tensor([[130228.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(1509077.8750, grad_fn=<MseLossBackward>)
output :  tensor([[118268.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1516861.6250, grad_fn=<MseLossBackward>)
output :  tensor([[144781.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7179e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168921.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1339e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146818.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(8303672.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180658.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(433663.4062, grad_fn=<MseLossBackward>)
output :  tensor([[143292.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(5255914.5000, grad_fn=<MseLossBackward>)
output :  tensor([[108334.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3616e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134282.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5154e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130407.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(21092348., grad_fn=<MseLossBackward>)
output :  tensor([[134614.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(57978232., grad_fn=<MseLossBackward>)
output :  tensor([[226468.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2156584., grad_fn=<MseLossBackward>)
output :  tensor([[130926.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(1751776.3750, grad_fn=<MseLossBackward>)
output :  tensor([[155255.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(39133628., grad_fn=<MseLossBackward>)
output :  tensor([[115102.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(9627736., grad_fn=<MseLossBackward>)
output :  tensor([[159145.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(729422.7500, grad_fn=<MseLossBackward>)
output :  tensor([[148744.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1395e+09, grad_fn=<MseLossBackward>)
output :  tensor([[191219.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(608741.3125, grad_fn=<MseLossBackward>)
output :  tensor([[134358.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(8300.9180, grad_fn=<MseLossBackward>)
output :  tensor([[112452.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(6014488., grad_fn=<MseLossBackward>)
output :  tensor([[233224.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(601666.8750, grad_fn=<MseLossBackward>)
output :  tensor([[168209.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0503e+09, grad_fn=<MseLossBackward>)
output :  tensor([[157937.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1128142.7500, grad_fn=<MseLossBackward>)
output :  tensor([[206814.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7452e+10, grad_fn=<MseLossBackward>)
output :  tensor([[247177.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1411e+10, grad_fn=<MseLossBackward>)
output :  tensor([[146712.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(10317245., grad_fn=<MseLossBackward>)
output :  tensor([[137757.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(14121272., grad_fn=<MseLossBackward>)
output :  tensor([[152973.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4108285.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135337.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(28485236., grad_fn=<MseLossBackward>)
output :  tensor([[178399.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6586e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182855.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(1548274.7500, grad_fn=<MseLossBackward>)
output :  tensor([[161833.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(111118.0547, grad_fn=<MseLossBackward>)
output :  tensor([[134853.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(66362152., grad_fn=<MseLossBackward>)
output :  tensor([[143005.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(255482.8594, grad_fn=<MseLossBackward>)
output :  tensor([[147841.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8071458.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176041.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0506e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195702.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5357e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136872.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(139070.7188, grad_fn=<MseLossBackward>)
output :  tensor([[171313.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(344330.5625, grad_fn=<MseLossBackward>)
output :  tensor([[176202.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(23014058., grad_fn=<MseLossBackward>)
output :  tensor([[116838.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(3380685.5000, grad_fn=<MseLossBackward>)
output :  tensor([[216097.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(24034354., grad_fn=<MseLossBackward>)
output :  tensor([[189843.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(40239796., grad_fn=<MseLossBackward>)
output :  tensor([[128432.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(8597632., grad_fn=<MseLossBackward>)
output :  tensor([[196080.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(175836.0781, grad_fn=<MseLossBackward>)
output :  tensor([[176284.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1916840.2500, grad_fn=<MseLossBackward>)
output :  tensor([[212305.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0257e+10, grad_fn=<MseLossBackward>)
output :  tensor([[209076.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3700393.2500, grad_fn=<MseLossBackward>)
output :  tensor([[162506.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(9.9265e+08, grad_fn=<MseLossBackward>)
output :  tensor([[193775.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(524357., grad_fn=<MseLossBackward>)
output :  tensor([[111138.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(3464804.2500, grad_fn=<MseLossBackward>)
output :  tensor([[116047.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(12584147., grad_fn=<MseLossBackward>)
output :  tensor([[112394.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(155661.0781, grad_fn=<MseLossBackward>)
output :  tensor([[146352.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(199934.7344, grad_fn=<MseLossBackward>)
output :  tensor([[162288.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2528e+10, grad_fn=<MseLossBackward>)
output :  tensor([[180765.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(585655.3750, grad_fn=<MseLossBackward>)
output :  tensor([[128501.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(1002079.1875, grad_fn=<MseLossBackward>)
output :  tensor([[142820.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(4750697., grad_fn=<MseLossBackward>)
output :  tensor([[182121.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2298e+09, grad_fn=<MseLossBackward>)
output :  tensor([[116017.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(779206.1875, grad_fn=<MseLossBackward>)
output :  tensor([[189691.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(53407320., grad_fn=<MseLossBackward>)
output :  tensor([[142996.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4013448.7500, grad_fn=<MseLossBackward>)
output :  tensor([[212165.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(539490.2500, grad_fn=<MseLossBackward>)
output :  tensor([[127183.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1399636.8750, grad_fn=<MseLossBackward>)
output :  tensor([[253057.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(22365362., grad_fn=<MseLossBackward>)
output :  tensor([[244813.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6149e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146826.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3798e+08, grad_fn=<MseLossBackward>)
output :  tensor([[88317.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4627e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196375.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1661e+09, grad_fn=<MseLossBackward>)
output :  tensor([[84367.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(11342372., grad_fn=<MseLossBackward>)
output :  tensor([[140283.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(613431.6250, grad_fn=<MseLossBackward>)
output :  tensor([[78848.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(11212557., grad_fn=<MseLossBackward>)
output :  tensor([[142502.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(202542.1875, grad_fn=<MseLossBackward>)
output :  tensor([[172625.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(11389570., grad_fn=<MseLossBackward>)
output :  tensor([[155360.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3459716.2500, grad_fn=<MseLossBackward>)
output :  tensor([[108812.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1993876.3750, grad_fn=<MseLossBackward>)
output :  tensor([[204158.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2453e+10, grad_fn=<MseLossBackward>)
output :  tensor([[128128.9141]], grad_fn=<AddmmBackward>)
loss:  tensor(137704.7656, grad_fn=<MseLossBackward>)
output :  tensor([[269906.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0187e+08, grad_fn=<MseLossBackward>)
output :  tensor([[299299.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1450e+08, grad_fn=<MseLossBackward>)
output :  tensor([[107167.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(110488.7188, grad_fn=<MseLossBackward>)
output :  tensor([[173339.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(704261.8750, grad_fn=<MseLossBackward>)
output :  tensor([[135000.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2905e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144735.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(32893452., grad_fn=<MseLossBackward>)
output :  tensor([[129960.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(83642.9688, grad_fn=<MseLossBackward>)
output :  tensor([[124684.0234]], grad_fn=<AddmmBackward>)
loss:  tensor(99841.1875, grad_fn=<MseLossBackward>)
output :  tensor([[133743.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8775e+08, grad_fn=<MseLossBackward>)
output :  tensor([[224213.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9516e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193883.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1643e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143365.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(285907.4375, grad_fn=<MseLossBackward>)
output :  tensor([[133754.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(39118772., grad_fn=<MseLossBackward>)
output :  tensor([[114285.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(9213169., grad_fn=<MseLossBackward>)
output :  tensor([[258397.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5597e+09, grad_fn=<MseLossBackward>)
output :  tensor([[135424.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(179895.2656, grad_fn=<MseLossBackward>)
output :  tensor([[203452.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(204713.8281, grad_fn=<MseLossBackward>)
output :  tensor([[100388.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(20353138., grad_fn=<MseLossBackward>)
output :  tensor([[138955.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(989620.8125, grad_fn=<MseLossBackward>)
output :  tensor([[210702.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9037e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183800.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(15217557., grad_fn=<MseLossBackward>)
output :  tensor([[184278.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(520201.5625, grad_fn=<MseLossBackward>)
output :  tensor([[163061.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1298e+10, grad_fn=<MseLossBackward>)
output :  tensor([[304522.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2886e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197905.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(30.4221, grad_fn=<MseLossBackward>)
output :  tensor([[262342.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9746e+10, grad_fn=<MseLossBackward>)
output :  tensor([[227652.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4705e+09, grad_fn=<MseLossBackward>)
output :  tensor([[289519.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5520e+08, grad_fn=<MseLossBackward>)
output :  tensor([[227233.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(10455825., grad_fn=<MseLossBackward>)
output :  tensor([[220879.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9282e+10, grad_fn=<MseLossBackward>)
output :  tensor([[194748.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(5069604., grad_fn=<MseLossBackward>)
output :  tensor([[157907.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3566e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135527.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(9163959., grad_fn=<MseLossBackward>)
output :  tensor([[135502.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(8.7209, grad_fn=<MseLossBackward>)
output :  tensor([[90777.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(49551.4570, grad_fn=<MseLossBackward>)
output :  tensor([[108373.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(139263.0781, grad_fn=<MseLossBackward>)
output :  tensor([[275104.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8940e+09, grad_fn=<MseLossBackward>)
output :  tensor([[234332.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(445326.8125, grad_fn=<MseLossBackward>)
output :  tensor([[147912.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(8480199., grad_fn=<MseLossBackward>)
output :  tensor([[138960.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2131737., grad_fn=<MseLossBackward>)
output :  tensor([[173685.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2220.7656, grad_fn=<MseLossBackward>)
output :  tensor([[143492.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(3087488.2500, grad_fn=<MseLossBackward>)
output :  tensor([[166134.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(8.0460e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167357.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(5559132.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135385.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2607064.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188450.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3494e+09, grad_fn=<MseLossBackward>)
output :  tensor([[114277.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(5189213., grad_fn=<MseLossBackward>)
output :  tensor([[172664.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(442204.2188, grad_fn=<MseLossBackward>)
output :  tensor([[116989.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(9062875., grad_fn=<MseLossBackward>)
output :  tensor([[87182.8359]], grad_fn=<AddmmBackward>)
loss:  tensor(33428.9805, grad_fn=<MseLossBackward>)
output :  tensor([[179955.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1971.9150, grad_fn=<MseLossBackward>)
output :  tensor([[110444.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(296658.9375, grad_fn=<MseLossBackward>)
output :  tensor([[242258.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(10619757., grad_fn=<MseLossBackward>)
output :  tensor([[249046.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(16372645., grad_fn=<MseLossBackward>)
output :  tensor([[134018.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(20413454., grad_fn=<MseLossBackward>)
output :  tensor([[109857.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(806656.5625, grad_fn=<MseLossBackward>)
output :  tensor([[288398.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2128e+10, grad_fn=<MseLossBackward>)
output :  tensor([[172843.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1805160.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129025.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(16206978., grad_fn=<MseLossBackward>)
output :  tensor([[141147.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3581e+08, grad_fn=<MseLossBackward>)
output :  tensor([[203515.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0993e+08, grad_fn=<MseLossBackward>)
output :  tensor([[141047.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2245.8713, grad_fn=<MseLossBackward>)
output :  tensor([[156696.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5204e+10, grad_fn=<MseLossBackward>)
output :  tensor([[162460.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(73284304., grad_fn=<MseLossBackward>)
output :  tensor([[130549.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1101056.7500, grad_fn=<MseLossBackward>)
output :  tensor([[254701.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5326e+10, grad_fn=<MseLossBackward>)
output :  tensor([[398732.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(10676148., grad_fn=<MseLossBackward>)
output :  tensor([[110742.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(3037259.2500, grad_fn=<MseLossBackward>)
output :  tensor([[109802.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(75641344., grad_fn=<MseLossBackward>)
output :  tensor([[155917.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(12835762., grad_fn=<MseLossBackward>)
output :  tensor([[128390.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5585e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162515.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.5385e+09, grad_fn=<MseLossBackward>)
output :  tensor([[171600.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7947e+09, grad_fn=<MseLossBackward>)
output :  tensor([[101848.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3066548.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139501.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(2246673., grad_fn=<MseLossBackward>)
output :  tensor([[369496.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4851832., grad_fn=<MseLossBackward>)
output :  tensor([[208457.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0742e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178581.]], grad_fn=<AddmmBackward>)
loss:  tensor(9492561., grad_fn=<MseLossBackward>)
output :  tensor([[204449.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2401773.5000, grad_fn=<MseLossBackward>)
output :  tensor([[136899.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4412888., grad_fn=<MseLossBackward>)
output :  tensor([[193929.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(325238.5312, grad_fn=<MseLossBackward>)
output :  tensor([[136249.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2652e+08, grad_fn=<MseLossBackward>)
output :  tensor([[179311.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2850346.2500, grad_fn=<MseLossBackward>)
output :  tensor([[240868.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1279231.7500, grad_fn=<MseLossBackward>)
output :  tensor([[174232.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(54063.5156, grad_fn=<MseLossBackward>)
output :  tensor([[111047.6953]], grad_fn=<AddmmBackward>)
loss:  tensor(9288447., grad_fn=<MseLossBackward>)
output :  tensor([[263396.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1355041.5000, grad_fn=<MseLossBackward>)
output :  tensor([[245964.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(16282486., grad_fn=<MseLossBackward>)
output :  tensor([[125811.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7902248., grad_fn=<MseLossBackward>)
output :  tensor([[216473.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4254e+09, grad_fn=<MseLossBackward>)
output :  tensor([[304715.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2371e+08, grad_fn=<MseLossBackward>)
output :  tensor([[205184.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3296097., grad_fn=<MseLossBackward>)
output :  tensor([[215995.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5377e+10, grad_fn=<MseLossBackward>)
output :  tensor([[159284.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1916061.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167359.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(6919777., grad_fn=<MseLossBackward>)
output :  tensor([[160363.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(11774334., grad_fn=<MseLossBackward>)
output :  tensor([[170289.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(84036.5781, grad_fn=<MseLossBackward>)
output :  tensor([[239835.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9322e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223926.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(30574680., grad_fn=<MseLossBackward>)
output :  tensor([[158996.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4392e+08, grad_fn=<MseLossBackward>)
output :  tensor([[124596.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2548812.2500, grad_fn=<MseLossBackward>)
output :  tensor([[175757.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1543418., grad_fn=<MseLossBackward>)
output :  tensor([[180791.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2741e+09, grad_fn=<MseLossBackward>)
output :  tensor([[209539.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4254e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133986.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(198498.0938, grad_fn=<MseLossBackward>)
output :  tensor([[150432.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3132e+08, grad_fn=<MseLossBackward>)
output :  tensor([[274244.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7595019.5000, grad_fn=<MseLossBackward>)
output :  tensor([[84912.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(7742.6250, grad_fn=<MseLossBackward>)
output :  tensor([[236539.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1525.8789, grad_fn=<MseLossBackward>)
output :  tensor([[262680.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0256e+11, grad_fn=<MseLossBackward>)
output :  tensor([[169196.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(645461.6250, grad_fn=<MseLossBackward>)
output :  tensor([[194630.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6297e+09, grad_fn=<MseLossBackward>)
output :  tensor([[153418.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2501488.2500, grad_fn=<MseLossBackward>)
output :  tensor([[208874.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7364e+09, grad_fn=<MseLossBackward>)
output :  tensor([[130716.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(2945272.7500, grad_fn=<MseLossBackward>)
output :  tensor([[147476.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(6131736.5000, grad_fn=<MseLossBackward>)
output :  tensor([[167994.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4998e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183827.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(4089621.5000, grad_fn=<MseLossBackward>)
output :  tensor([[130477.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(20043668., grad_fn=<MseLossBackward>)
output :  tensor([[138526.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4104866., grad_fn=<MseLossBackward>)
output :  tensor([[178688.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(32359922., grad_fn=<MseLossBackward>)
output :  tensor([[196171.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8975e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238997.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(16022633., grad_fn=<MseLossBackward>)
output :  tensor([[154176.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(678589.8125, grad_fn=<MseLossBackward>)
output :  tensor([[198037.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4150515., grad_fn=<MseLossBackward>)
output :  tensor([[160361.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6770e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178427.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1149887.6250, grad_fn=<MseLossBackward>)
output :  tensor([[178682.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1482306.2500, grad_fn=<MseLossBackward>)
output :  tensor([[96290.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(502869.3438, grad_fn=<MseLossBackward>)
output :  tensor([[172158.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1630e+10, grad_fn=<MseLossBackward>)
output :  tensor([[134408.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(349336.4062, grad_fn=<MseLossBackward>)
output :  tensor([[119972.6016]], grad_fn=<AddmmBackward>)
loss:  tensor(24726766., grad_fn=<MseLossBackward>)
output :  tensor([[169416.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(21011624., grad_fn=<MseLossBackward>)
output :  tensor([[84826.5391]], grad_fn=<AddmmBackward>)
loss:  tensor(30088.6973, grad_fn=<MseLossBackward>)
output :  tensor([[289983.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(266.0977, grad_fn=<MseLossBackward>)
output :  tensor([[166534.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2353252., grad_fn=<MseLossBackward>)
output :  tensor([[194434.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9247e+10, grad_fn=<MseLossBackward>)
output :  tensor([[249226.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7409e+08, grad_fn=<MseLossBackward>)
output :  tensor([[155523.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(20463184., grad_fn=<MseLossBackward>)
output :  tensor([[120840.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(9984069., grad_fn=<MseLossBackward>)
output :  tensor([[118055.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3402987.2500, grad_fn=<MseLossBackward>)
output :  tensor([[145825.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(9.5020e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174334.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(111702.1719, grad_fn=<MseLossBackward>)
output :  tensor([[110187.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6659e+08, grad_fn=<MseLossBackward>)
output :  tensor([[214404.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0732e+10, grad_fn=<MseLossBackward>)
output :  tensor([[236240.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(27665628., grad_fn=<MseLossBackward>)
output :  tensor([[255655.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9470e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221332.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3.1213e+08, grad_fn=<MseLossBackward>)
output :  tensor([[199276.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3508e+10, grad_fn=<MseLossBackward>)
output :  tensor([[192229.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(22372014., grad_fn=<MseLossBackward>)
output :  tensor([[209066.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.6571e+10, grad_fn=<MseLossBackward>)
output :  tensor([[193072.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0428e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179279.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(290605.2188, grad_fn=<MseLossBackward>)
output :  tensor([[153287.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1658420.7500, grad_fn=<MseLossBackward>)
output :  tensor([[336003.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(992638.6250, grad_fn=<MseLossBackward>)
output :  tensor([[211303.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(484633.5312, grad_fn=<MseLossBackward>)
output :  tensor([[160405.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(164721.8281, grad_fn=<MseLossBackward>)
output :  tensor([[190943.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5560e+09, grad_fn=<MseLossBackward>)
output :  tensor([[108563.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(12701651., grad_fn=<MseLossBackward>)
output :  tensor([[278948.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6204e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170390.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(12314507., grad_fn=<MseLossBackward>)
output :  tensor([[219630.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(37583988., grad_fn=<MseLossBackward>)
output :  tensor([[216439.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(20801580., grad_fn=<MseLossBackward>)
output :  tensor([[178237.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(926947.7500, grad_fn=<MseLossBackward>)
output :  tensor([[199460.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(5473406.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157950.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8705727., grad_fn=<MseLossBackward>)
output :  tensor([[146391.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1522e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118374.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(15787.5303, grad_fn=<MseLossBackward>)
output :  tensor([[142662.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(7088407., grad_fn=<MseLossBackward>)
output :  tensor([[148884.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(13253.7656, grad_fn=<MseLossBackward>)
output :  tensor([[203443.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5514e+10, grad_fn=<MseLossBackward>)
output :  tensor([[161662.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4674514.5000, grad_fn=<MseLossBackward>)
output :  tensor([[102218.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(7389817.5000, grad_fn=<MseLossBackward>)
output :  tensor([[228880.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2365e+08, grad_fn=<MseLossBackward>)
output :  tensor([[186140.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.2605e+08, grad_fn=<MseLossBackward>)
output :  tensor([[176456.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(802.4827, grad_fn=<MseLossBackward>)
output :  tensor([[82918.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(843211.7500, grad_fn=<MseLossBackward>)
output :  tensor([[128572.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(5195.2559, grad_fn=<MseLossBackward>)
output :  tensor([[216061.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4248945., grad_fn=<MseLossBackward>)
output :  tensor([[144085.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(7318.2676, grad_fn=<MseLossBackward>)
output :  tensor([[133850.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(14828998., grad_fn=<MseLossBackward>)
output :  tensor([[146057.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(11951173., grad_fn=<MseLossBackward>)
output :  tensor([[176203.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4980e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144620.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(384981.4688, grad_fn=<MseLossBackward>)
output :  tensor([[162797.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(7826443.5000, grad_fn=<MseLossBackward>)
output :  tensor([[213775.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1499170.6250, grad_fn=<MseLossBackward>)
output :  tensor([[136228.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(9.7525e+08, grad_fn=<MseLossBackward>)
output :  tensor([[258597.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(12944030., grad_fn=<MseLossBackward>)
output :  tensor([[162254.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7589250., grad_fn=<MseLossBackward>)
output :  tensor([[134271.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(33304982., grad_fn=<MseLossBackward>)
output :  tensor([[95065.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(4321.0078, grad_fn=<MseLossBackward>)
output :  tensor([[154046.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8367e+09, grad_fn=<MseLossBackward>)
output :  tensor([[177626.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5169584., grad_fn=<MseLossBackward>)
output :  tensor([[120510.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(113.8889, grad_fn=<MseLossBackward>)
output :  tensor([[186398.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8107e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144290.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1978e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151539.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2687345.5000, grad_fn=<MseLossBackward>)
output :  tensor([[187588.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(26122.6406, grad_fn=<MseLossBackward>)
output :  tensor([[256527.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3359e+09, grad_fn=<MseLossBackward>)
output :  tensor([[92795.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1677146.3750, grad_fn=<MseLossBackward>)
output :  tensor([[240883.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(780572.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128160.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(115525.6406, grad_fn=<MseLossBackward>)
output :  tensor([[165628.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0054e+10, grad_fn=<MseLossBackward>)
output :  tensor([[113104.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7174e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178692.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(7252080.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162051.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1310e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153530.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3040e+08, grad_fn=<MseLossBackward>)
output :  tensor([[234170.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(23320298., grad_fn=<MseLossBackward>)
output :  tensor([[226944.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(9.6445e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127402.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(162264.2031, grad_fn=<MseLossBackward>)
output :  tensor([[127470.7734]], grad_fn=<AddmmBackward>)
loss:  tensor(2163174.5000, grad_fn=<MseLossBackward>)
output :  tensor([[226514.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(236120.0625, grad_fn=<MseLossBackward>)
output :  tensor([[230296.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(13718343., grad_fn=<MseLossBackward>)
output :  tensor([[223363.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(11133692., grad_fn=<MseLossBackward>)
output :  tensor([[148192.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(36912.0156, grad_fn=<MseLossBackward>)
output :  tensor([[213500.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(12255251., grad_fn=<MseLossBackward>)
output :  tensor([[126598.1172]], grad_fn=<AddmmBackward>)
loss:  tensor(43535152., grad_fn=<MseLossBackward>)
output :  tensor([[133983.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2201931.5000, grad_fn=<MseLossBackward>)
output :  tensor([[313385.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2605803., grad_fn=<MseLossBackward>)
output :  tensor([[139613.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(1921472.5000, grad_fn=<MseLossBackward>)
output :  tensor([[119357.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7413e+09, grad_fn=<MseLossBackward>)
output :  tensor([[107270.7578]], grad_fn=<AddmmBackward>)
loss:  tensor(4969520.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155865.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7670e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183767.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2733e+09, grad_fn=<MseLossBackward>)
output :  tensor([[174142.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1305949., grad_fn=<MseLossBackward>)
output :  tensor([[194141.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(47041596., grad_fn=<MseLossBackward>)
output :  tensor([[99220.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(608278.1250, grad_fn=<MseLossBackward>)
output :  tensor([[179787.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(620353.1250, grad_fn=<MseLossBackward>)
output :  tensor([[169777.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3525945., grad_fn=<MseLossBackward>)
output :  tensor([[142120.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(9735180., grad_fn=<MseLossBackward>)
output :  tensor([[262683.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2961e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141587.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2022e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172289.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(505432.1250, grad_fn=<MseLossBackward>)
output :  tensor([[139634.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(133853.0781, grad_fn=<MseLossBackward>)
output :  tensor([[196687.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(14536109., grad_fn=<MseLossBackward>)
output :  tensor([[169030.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(939203.2500, grad_fn=<MseLossBackward>)
output :  tensor([[240991.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(9049286., grad_fn=<MseLossBackward>)
output :  tensor([[134321.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(31728.5156, grad_fn=<MseLossBackward>)
output :  tensor([[150538.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(1413423.7500, grad_fn=<MseLossBackward>)
output :  tensor([[213730.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1611828.6250, grad_fn=<MseLossBackward>)
output :  tensor([[158535.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(41792388., grad_fn=<MseLossBackward>)
output :  tensor([[197928.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(79726480., grad_fn=<MseLossBackward>)
output :  tensor([[131807.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3941e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130874.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(3514013.7500, grad_fn=<MseLossBackward>)
output :  tensor([[139178.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(674913.6250, grad_fn=<MseLossBackward>)
output :  tensor([[203527.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3524e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167249.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7300e+09, grad_fn=<MseLossBackward>)
output :  tensor([[73373.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7884e+08, grad_fn=<MseLossBackward>)
output :  tensor([[90012.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(30388518., grad_fn=<MseLossBackward>)
output :  tensor([[251532.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(3098370., grad_fn=<MseLossBackward>)
output :  tensor([[205998.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.4889e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115410.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(168535.9062, grad_fn=<MseLossBackward>)
output :  tensor([[160930.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0595e+08, grad_fn=<MseLossBackward>)
output :  tensor([[211195.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(77525552., grad_fn=<MseLossBackward>)
output :  tensor([[182652.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6296e+09, grad_fn=<MseLossBackward>)
output :  tensor([[161130.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(37578624., grad_fn=<MseLossBackward>)
output :  tensor([[169296.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(495110.1250, grad_fn=<MseLossBackward>)
output :  tensor([[115091.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(8356.5312, grad_fn=<MseLossBackward>)
output :  tensor([[157566.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(6586361., grad_fn=<MseLossBackward>)
output :  tensor([[194045.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6523e+08, grad_fn=<MseLossBackward>)
output :  tensor([[216129.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(11357216., grad_fn=<MseLossBackward>)
output :  tensor([[248749.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4626e+11, grad_fn=<MseLossBackward>)
output :  tensor([[143715.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(10786709., grad_fn=<MseLossBackward>)
output :  tensor([[110437.3672]], grad_fn=<AddmmBackward>)
loss:  tensor(3831286.2500, grad_fn=<MseLossBackward>)
output :  tensor([[173303.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(73899544., grad_fn=<MseLossBackward>)
output :  tensor([[151302.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(643880.8750, grad_fn=<MseLossBackward>)
output :  tensor([[236473.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(276758.1875, grad_fn=<MseLossBackward>)
output :  tensor([[114597.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(162157.2188, grad_fn=<MseLossBackward>)
output :  tensor([[184486.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2515842., grad_fn=<MseLossBackward>)
output :  tensor([[183848.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(8133726., grad_fn=<MseLossBackward>)
output :  tensor([[164458.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4193e+10, grad_fn=<MseLossBackward>)
output :  tensor([[95946.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2340e+08, grad_fn=<MseLossBackward>)
output :  tensor([[239513.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(263874.8438, grad_fn=<MseLossBackward>)
output :  tensor([[179319.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(11016280., grad_fn=<MseLossBackward>)
output :  tensor([[141736.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(3014075.7500, grad_fn=<MseLossBackward>)
output :  tensor([[235493.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(243310.9844, grad_fn=<MseLossBackward>)
output :  tensor([[168674.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(32200128., grad_fn=<MseLossBackward>)
output :  tensor([[208991.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3458e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135323.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(104803.9453, grad_fn=<MseLossBackward>)
output :  tensor([[188784.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7.1742e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135834.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(27473.0625, grad_fn=<MseLossBackward>)
output :  tensor([[227586.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(70778832., grad_fn=<MseLossBackward>)
output :  tensor([[227895.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8859e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92682.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(7193794.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158367.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1138289., grad_fn=<MseLossBackward>)
output :  tensor([[247726.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5166e+10, grad_fn=<MseLossBackward>)
output :  tensor([[147966.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(8798546., grad_fn=<MseLossBackward>)
output :  tensor([[108670.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7364e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163842.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(432861.1875, grad_fn=<MseLossBackward>)
output :  tensor([[142765.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1523450.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129425.]], grad_fn=<AddmmBackward>)
loss:  tensor(1500625., grad_fn=<MseLossBackward>)
output :  tensor([[189566.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8210e+09, grad_fn=<MseLossBackward>)
output :  tensor([[124920.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(5857043., grad_fn=<MseLossBackward>)
output :  tensor([[152971.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(943174.8125, grad_fn=<MseLossBackward>)
output :  tensor([[169633.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4477786.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151542.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(294153.6875, grad_fn=<MseLossBackward>)
output :  tensor([[164667.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3123945.7500, grad_fn=<MseLossBackward>)
output :  tensor([[137034.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8595e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135241.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(10509754., grad_fn=<MseLossBackward>)
output :  tensor([[155089.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.5888e+08, grad_fn=<MseLossBackward>)
output :  tensor([[144480.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(107727.5469, grad_fn=<MseLossBackward>)
output :  tensor([[163003.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1571967.3750, grad_fn=<MseLossBackward>)
output :  tensor([[133543.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5900e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148656.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(20466.8789, grad_fn=<MseLossBackward>)
output :  tensor([[184687.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(10974623., grad_fn=<MseLossBackward>)
output :  tensor([[167237.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(3108114., grad_fn=<MseLossBackward>)
output :  tensor([[183596.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(12934250., grad_fn=<MseLossBackward>)
output :  tensor([[220983.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(967764.0625, grad_fn=<MseLossBackward>)
output :  tensor([[109771.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(3502834., grad_fn=<MseLossBackward>)
output :  tensor([[135629.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1512e+08, grad_fn=<MseLossBackward>)
output :  tensor([[279840.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(37939824., grad_fn=<MseLossBackward>)
output :  tensor([[113614.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(5690871., grad_fn=<MseLossBackward>)
output :  tensor([[176572.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8859e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182580.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(5853073., grad_fn=<MseLossBackward>)
output :  tensor([[197721.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4937e+08, grad_fn=<MseLossBackward>)
output :  tensor([[250192.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1539e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221908.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(8395.1406, grad_fn=<MseLossBackward>)
output :  tensor([[120733.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2002e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173164.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0659e+08, grad_fn=<MseLossBackward>)
output :  tensor([[123434.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(319648.8750, grad_fn=<MseLossBackward>)
output :  tensor([[184647.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.4584e+10, grad_fn=<MseLossBackward>)
output :  tensor([[154837.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(3375085.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153577.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(50087908., grad_fn=<MseLossBackward>)
output :  tensor([[200615.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(32311942., grad_fn=<MseLossBackward>)
output :  tensor([[143967.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3150e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175360.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(408760.4375, grad_fn=<MseLossBackward>)
output :  tensor([[253785.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6122e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149302.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1695814.3750, grad_fn=<MseLossBackward>)
output :  tensor([[201200.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(2145309.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157772.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4739805., grad_fn=<MseLossBackward>)
output :  tensor([[120221.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0382e+09, grad_fn=<MseLossBackward>)
output :  tensor([[136691.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(886893.0625, grad_fn=<MseLossBackward>)
output :  tensor([[185825.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(3333648.2500, grad_fn=<MseLossBackward>)
output :  tensor([[196533.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(42688256., grad_fn=<MseLossBackward>)
output :  tensor([[240769.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3262e+09, grad_fn=<MseLossBackward>)
output :  tensor([[247764.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(85285800., grad_fn=<MseLossBackward>)
output :  tensor([[191280.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6312e+10, grad_fn=<MseLossBackward>)
output :  tensor([[142497.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2.6008e+09, grad_fn=<MseLossBackward>)
output :  tensor([[148389.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(15125050., grad_fn=<MseLossBackward>)
output :  tensor([[70816.5547]], grad_fn=<AddmmBackward>)
loss:  tensor(9.4966e+08, grad_fn=<MseLossBackward>)
output :  tensor([[136308.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1713194.6250, grad_fn=<MseLossBackward>)
output :  tensor([[130828.5078]], grad_fn=<AddmmBackward>)
loss:  tensor(3719142.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155032.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1065894.8750, grad_fn=<MseLossBackward>)
output :  tensor([[127899.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(808678.6875, grad_fn=<MseLossBackward>)
output :  tensor([[79618.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(9723532., grad_fn=<MseLossBackward>)
output :  tensor([[85904.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(15243961., grad_fn=<MseLossBackward>)
output :  tensor([[238233.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(38855936., grad_fn=<MseLossBackward>)
output :  tensor([[140362.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7634e+08, grad_fn=<MseLossBackward>)
output :  tensor([[126549.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(15607438., grad_fn=<MseLossBackward>)
output :  tensor([[167681.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(464378.3750, grad_fn=<MseLossBackward>)
output :  tensor([[233096.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(3623074.2500, grad_fn=<MseLossBackward>)
output :  tensor([[190568.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(2469023., grad_fn=<MseLossBackward>)
output :  tensor([[155228.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(594947.0625, grad_fn=<MseLossBackward>)
output :  tensor([[196326.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2474722.2500, grad_fn=<MseLossBackward>)
output :  tensor([[209870.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3600e+08, grad_fn=<MseLossBackward>)
output :  tensor([[135835.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(1355914.7500, grad_fn=<MseLossBackward>)
output :  tensor([[153988.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1022942.6250, grad_fn=<MseLossBackward>)
output :  tensor([[138526.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(6380992., grad_fn=<MseLossBackward>)
output :  tensor([[202918.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(7.3341e+08, grad_fn=<MseLossBackward>)
output :  tensor([[157009.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(9058313., grad_fn=<MseLossBackward>)
output :  tensor([[137452.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9318e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139845.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(25548760., grad_fn=<MseLossBackward>)
output :  tensor([[206330.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(32142876., grad_fn=<MseLossBackward>)
output :  tensor([[100621.2578]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4675e+08, grad_fn=<MseLossBackward>)
output :  tensor([[167788.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(83196.1875, grad_fn=<MseLossBackward>)
output :  tensor([[130147.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(4610347., grad_fn=<MseLossBackward>)
output :  tensor([[149132.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(4546223.5000, grad_fn=<MseLossBackward>)
output :  tensor([[103192.8672]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6654e+09, grad_fn=<MseLossBackward>)
output :  tensor([[139087.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2520255.5000, grad_fn=<MseLossBackward>)
output :  tensor([[237528.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(2335882.5000, grad_fn=<MseLossBackward>)
output :  tensor([[144900.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(9984.3809, grad_fn=<MseLossBackward>)
output :  tensor([[137423.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(5871.3906, grad_fn=<MseLossBackward>)
output :  tensor([[162120.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1642e+09, grad_fn=<MseLossBackward>)
output :  tensor([[271105.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(47527668., grad_fn=<MseLossBackward>)
output :  tensor([[174313.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(471732.8750, grad_fn=<MseLossBackward>)
output :  tensor([[105704.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8578675., grad_fn=<MseLossBackward>)
output :  tensor([[202233.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.6651e+09, grad_fn=<MseLossBackward>)
output :  tensor([[155398.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(12967876., grad_fn=<MseLossBackward>)
output :  tensor([[162997.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5980e+10, grad_fn=<MseLossBackward>)
output :  tensor([[99240.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(883864.3750, grad_fn=<MseLossBackward>)
output :  tensor([[123575.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(608.7014, grad_fn=<MseLossBackward>)
output :  tensor([[155887.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(12751.3496, grad_fn=<MseLossBackward>)
output :  tensor([[141462.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(2137581., grad_fn=<MseLossBackward>)
output :  tensor([[201202.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1447133.8750, grad_fn=<MseLossBackward>)
output :  tensor([[143828.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(3344040.7500, grad_fn=<MseLossBackward>)
output :  tensor([[261428.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(725770.8750, grad_fn=<MseLossBackward>)
output :  tensor([[126454.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1192e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167367.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3486039., grad_fn=<MseLossBackward>)
output :  tensor([[187462.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(1076082., grad_fn=<MseLossBackward>)
output :  tensor([[124145.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0010e+08, grad_fn=<MseLossBackward>)
output :  tensor([[249190.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(655189.0625, grad_fn=<MseLossBackward>)
output :  tensor([[159204.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(7.7258e+08, grad_fn=<MseLossBackward>)
output :  tensor([[244914.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(189850.8281, grad_fn=<MseLossBackward>)
output :  tensor([[145182.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1399378.1250, grad_fn=<MseLossBackward>)
output :  tensor([[214000.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(16006501., grad_fn=<MseLossBackward>)
output :  tensor([[175658.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(10615480., grad_fn=<MseLossBackward>)
output :  tensor([[154339.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(115281.4688, grad_fn=<MseLossBackward>)
output :  tensor([[118624.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(389736.8438, grad_fn=<MseLossBackward>)
output :  tensor([[238275.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3829e+09, grad_fn=<MseLossBackward>)
output :  tensor([[236965.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(9205535., grad_fn=<MseLossBackward>)
output :  tensor([[154722.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1919263.8750, grad_fn=<MseLossBackward>)
output :  tensor([[254659.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(57772.6289, grad_fn=<MseLossBackward>)
output :  tensor([[124162.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(93294768., grad_fn=<MseLossBackward>)
output :  tensor([[176581.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(337869.7188, grad_fn=<MseLossBackward>)
output :  tensor([[161253.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1572359.2500, grad_fn=<MseLossBackward>)
output :  tensor([[133814.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(7923697., grad_fn=<MseLossBackward>)
output :  tensor([[193268.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0664e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162245.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3078983., grad_fn=<MseLossBackward>)
output :  tensor([[159454.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(12572121., grad_fn=<MseLossBackward>)
output :  tensor([[155431.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6596710.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154918.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(25182048., grad_fn=<MseLossBackward>)
output :  tensor([[171371.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8280e+09, grad_fn=<MseLossBackward>)
output :  tensor([[158124.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3515742.2500, grad_fn=<MseLossBackward>)
output :  tensor([[377856.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(37380232., grad_fn=<MseLossBackward>)
output :  tensor([[141853.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2062e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130381.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0143e+09, grad_fn=<MseLossBackward>)
output :  tensor([[276707.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(20299530., grad_fn=<MseLossBackward>)
output :  tensor([[160050.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3801403.2500, grad_fn=<MseLossBackward>)
output :  tensor([[131298.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1661e+08, grad_fn=<MseLossBackward>)
output :  tensor([[223992.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(64117552., grad_fn=<MseLossBackward>)
output :  tensor([[178791.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(2917851.2500, grad_fn=<MseLossBackward>)
output :  tensor([[152533.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(284722.2812, grad_fn=<MseLossBackward>)
output :  tensor([[144585.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(171939.8125, grad_fn=<MseLossBackward>)
output :  tensor([[154997.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2753e+08, grad_fn=<MseLossBackward>)
output :  tensor([[103924.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(15405318., grad_fn=<MseLossBackward>)
output :  tensor([[71618.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3499e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164280.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(517275.6250, grad_fn=<MseLossBackward>)
output :  tensor([[191513.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3313e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159686.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2845494.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154691.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(7887321., grad_fn=<MseLossBackward>)
output :  tensor([[137319.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(17140.5371, grad_fn=<MseLossBackward>)
output :  tensor([[205645.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(92882.0859, grad_fn=<MseLossBackward>)
output :  tensor([[139133.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1285459.8750, grad_fn=<MseLossBackward>)
output :  tensor([[182915.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6151e+10, grad_fn=<MseLossBackward>)
output :  tensor([[145745.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(64881.6406, grad_fn=<MseLossBackward>)
output :  tensor([[111180.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9412e+08, grad_fn=<MseLossBackward>)
output :  tensor([[95555.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2420552.5000, grad_fn=<MseLossBackward>)
output :  tensor([[175159.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(25545.0293, grad_fn=<MseLossBackward>)
output :  tensor([[264684.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(18355334., grad_fn=<MseLossBackward>)
output :  tensor([[143685.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(4775522.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158371.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2321861.7500, grad_fn=<MseLossBackward>)
output :  tensor([[134156.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(2744147.5000, grad_fn=<MseLossBackward>)
output :  tensor([[145161.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(18823532., grad_fn=<MseLossBackward>)
output :  tensor([[168376.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(226620.6250, grad_fn=<MseLossBackward>)
output :  tensor([[125864.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(1288668.3750, grad_fn=<MseLossBackward>)
output :  tensor([[170654.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5816e+08, grad_fn=<MseLossBackward>)
output :  tensor([[156928.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5052.0996, grad_fn=<MseLossBackward>)
output :  tensor([[118509.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4038655.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161279.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1439e+09, grad_fn=<MseLossBackward>)
output :  tensor([[56281.0977]], grad_fn=<AddmmBackward>)
loss:  tensor(18327798., grad_fn=<MseLossBackward>)
output :  tensor([[233801.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1934e+09, grad_fn=<MseLossBackward>)
output :  tensor([[202991.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(3965263.2500, grad_fn=<MseLossBackward>)
output :  tensor([[182659.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(5479037.5000, grad_fn=<MseLossBackward>)
output :  tensor([[107784.8984]], grad_fn=<AddmmBackward>)
loss:  tensor(3185862.5000, grad_fn=<MseLossBackward>)
output :  tensor([[88325.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(1757716.6250, grad_fn=<MseLossBackward>)
output :  tensor([[145073.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(25744366., grad_fn=<MseLossBackward>)
output :  tensor([[222052.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(5.1764e+09, grad_fn=<MseLossBackward>)
output :  tensor([[205837.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(2764062., grad_fn=<MseLossBackward>)
output :  tensor([[165773.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(598471.4375, grad_fn=<MseLossBackward>)
output :  tensor([[176102.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9027e+09, grad_fn=<MseLossBackward>)
output :  tensor([[192934.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(8611382., grad_fn=<MseLossBackward>)
output :  tensor([[87368.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(135475.7500, grad_fn=<MseLossBackward>)
output :  tensor([[137761.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(5012561.5000, grad_fn=<MseLossBackward>)
output :  tensor([[111242.2891]], grad_fn=<AddmmBackward>)
loss:  tensor(550993.0625, grad_fn=<MseLossBackward>)
output :  tensor([[146475.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1058e+08, grad_fn=<MseLossBackward>)
output :  tensor([[171528.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6426e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195776.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(85068632., grad_fn=<MseLossBackward>)
output :  tensor([[182028.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(4113037.5000, grad_fn=<MseLossBackward>)
output :  tensor([[97294.3203]], grad_fn=<AddmmBackward>)
loss:  tensor(630944.7500, grad_fn=<MseLossBackward>)
output :  tensor([[116087.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(1996017.1250, grad_fn=<MseLossBackward>)
output :  tensor([[160964.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3062e+08, grad_fn=<MseLossBackward>)
output :  tensor([[198804.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(1428884., grad_fn=<MseLossBackward>)
output :  tensor([[142857.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1306270.3750, grad_fn=<MseLossBackward>)
train_loss: [2.5329272e+09]
epoch_result tensor([0.])
output :  tensor([[159921.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2019862.7500, grad_fn=<MseLossBackward>)
output :  tensor([[121406.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(352409.1875, grad_fn=<MseLossBackward>)
output :  tensor([[193262.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(881544.9375, grad_fn=<MseLossBackward>)
output :  tensor([[179836.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(8045643.5000, grad_fn=<MseLossBackward>)
output :  tensor([[151406.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0724e+08, grad_fn=<MseLossBackward>)
output :  tensor([[127814.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(34505.9648, grad_fn=<MseLossBackward>)
output :  tensor([[142077.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1161006.2500, grad_fn=<MseLossBackward>)
output :  tensor([[119372.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(138477.0156, grad_fn=<MseLossBackward>)
output :  tensor([[64425.8477]], grad_fn=<AddmmBackward>)
loss:  tensor(35115672., grad_fn=<MseLossBackward>)
output :  tensor([[166133.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(17947.6250, grad_fn=<MseLossBackward>)
output :  tensor([[144322.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(18686572., grad_fn=<MseLossBackward>)
output :  tensor([[227057.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(4233949., grad_fn=<MseLossBackward>)
output :  tensor([[167239.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(3099965.5000, grad_fn=<MseLossBackward>)
output :  tensor([[248369.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1769440.3750, grad_fn=<MseLossBackward>)
output :  tensor([[52019.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(8885336., grad_fn=<MseLossBackward>)
output :  tensor([[158966.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0929e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175401.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(161302.6406, grad_fn=<MseLossBackward>)
output :  tensor([[162615.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(37394752., grad_fn=<MseLossBackward>)
output :  tensor([[275020.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(425.3906, grad_fn=<MseLossBackward>)
output :  tensor([[195929.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(1145502., grad_fn=<MseLossBackward>)
output :  tensor([[138353.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5156e+10, grad_fn=<MseLossBackward>)
output :  tensor([[195380.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2255628.5000, grad_fn=<MseLossBackward>)
output :  tensor([[178258.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1755e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151325.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(106031.6406, grad_fn=<MseLossBackward>)
output :  tensor([[165489.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(20340382., grad_fn=<MseLossBackward>)
output :  tensor([[86159.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(577540.6250, grad_fn=<MseLossBackward>)
output :  tensor([[169584.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2018e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185202.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(41025.2383, grad_fn=<MseLossBackward>)
output :  tensor([[208932.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1685e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109643.4922]], grad_fn=<AddmmBackward>)
loss:  tensor(127097.8203, grad_fn=<MseLossBackward>)
output :  tensor([[170490.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(259924.7188, grad_fn=<MseLossBackward>)
output :  tensor([[138512.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(4049087.2500, grad_fn=<MseLossBackward>)
output :  tensor([[128776.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(50092.0352, grad_fn=<MseLossBackward>)
output :  tensor([[123209.8047]], grad_fn=<AddmmBackward>)
loss:  tensor(13762651., grad_fn=<MseLossBackward>)
output :  tensor([[144735.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6926e+08, grad_fn=<MseLossBackward>)
output :  tensor([[168932.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1336e+10, grad_fn=<MseLossBackward>)
output :  tensor([[148963.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(542110.0625, grad_fn=<MseLossBackward>)
output :  tensor([[178992.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1015749., grad_fn=<MseLossBackward>)
output :  tensor([[141005.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(34.6995, grad_fn=<MseLossBackward>)
output :  tensor([[107141.0391]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9382e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134024.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5571e+09, grad_fn=<MseLossBackward>)
output :  tensor([[137453.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6017592.5000, grad_fn=<MseLossBackward>)
output :  tensor([[138323.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2822e+08, grad_fn=<MseLossBackward>)
output :  tensor([[222224.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7702186., grad_fn=<MseLossBackward>)
output :  tensor([[132647.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(158229.9219, grad_fn=<MseLossBackward>)
output :  tensor([[150373.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1885772.6250, grad_fn=<MseLossBackward>)
output :  tensor([[113398.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1955758.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160538.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(290184.2188, grad_fn=<MseLossBackward>)
output :  tensor([[148239.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1866e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194810.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(7896188., grad_fn=<MseLossBackward>)
output :  tensor([[135180.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(533287.8750, grad_fn=<MseLossBackward>)
output :  tensor([[102725.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(52920852., grad_fn=<MseLossBackward>)
output :  tensor([[235301.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(1694024.2500, grad_fn=<MseLossBackward>)
output :  tensor([[167378.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1263e+09, grad_fn=<MseLossBackward>)
output :  tensor([[165754.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(45621160., grad_fn=<MseLossBackward>)
output :  tensor([[202773.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8807e+10, grad_fn=<MseLossBackward>)
output :  tensor([[247590.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1323e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143544.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(2013.7656, grad_fn=<MseLossBackward>)
output :  tensor([[143901.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(98036920., grad_fn=<MseLossBackward>)
output :  tensor([[158250.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(10568290., grad_fn=<MseLossBackward>)
output :  tensor([[135291.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(27998318., grad_fn=<MseLossBackward>)
output :  tensor([[178599.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6261e+09, grad_fn=<MseLossBackward>)
output :  tensor([[182893.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1454662.1250, grad_fn=<MseLossBackward>)
output :  tensor([[162499.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(998906.5625, grad_fn=<MseLossBackward>)
output :  tensor([[146630.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(13183026., grad_fn=<MseLossBackward>)
output :  tensor([[142870.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(137409.2188, grad_fn=<MseLossBackward>)
output :  tensor([[143516.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(2201143.2500, grad_fn=<MseLossBackward>)
output :  tensor([[171892.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5960e+09, grad_fn=<MseLossBackward>)
output :  tensor([[195031.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8262e+08, grad_fn=<MseLossBackward>)
output :  tensor([[134832.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(2780556.2500, grad_fn=<MseLossBackward>)
output :  tensor([[177062.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(26649470., grad_fn=<MseLossBackward>)
output :  tensor([[176908.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(16743569., grad_fn=<MseLossBackward>)
output :  tensor([[116356.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(1839901.5000, grad_fn=<MseLossBackward>)
output :  tensor([[219950.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1102171.8750, grad_fn=<MseLossBackward>)
output :  tensor([[183301.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(39296.8672, grad_fn=<MseLossBackward>)
output :  tensor([[128607.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(9654711., grad_fn=<MseLossBackward>)
output :  tensor([[199775.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(10731664., grad_fn=<MseLossBackward>)
output :  tensor([[176402.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(2258586.2500, grad_fn=<MseLossBackward>)
output :  tensor([[211106.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0675e+10, grad_fn=<MseLossBackward>)
output :  tensor([[210607.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(153933.6250, grad_fn=<MseLossBackward>)
output :  tensor([[161539.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(9.3263e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196235.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3010930., grad_fn=<MseLossBackward>)
output :  tensor([[112361.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(407821.9375, grad_fn=<MseLossBackward>)
output :  tensor([[114640.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4580536.5000, grad_fn=<MseLossBackward>)
output :  tensor([[114214.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(4904391., grad_fn=<MseLossBackward>)
output :  tensor([[148354.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(2415547.2500, grad_fn=<MseLossBackward>)
output :  tensor([[158563.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3885e+10, grad_fn=<MseLossBackward>)
output :  tensor([[179193.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(650492.6875, grad_fn=<MseLossBackward>)
output :  tensor([[128571.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1148949.5000, grad_fn=<MseLossBackward>)
output :  tensor([[148287.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(10808273., grad_fn=<MseLossBackward>)
output :  tensor([[176549.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7347e+09, grad_fn=<MseLossBackward>)
output :  tensor([[122015.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(26172336., grad_fn=<MseLossBackward>)
output :  tensor([[193392.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(13012253., grad_fn=<MseLossBackward>)
output :  tensor([[147146.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(4605919.5000, grad_fn=<MseLossBackward>)
output :  tensor([[212672.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(51798.9141, grad_fn=<MseLossBackward>)
output :  tensor([[127694.6797]], grad_fn=<AddmmBackward>)
loss:  tensor(2871939.2500, grad_fn=<MseLossBackward>)
output :  tensor([[247617.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(505098.9375, grad_fn=<MseLossBackward>)
output :  tensor([[240419.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9874e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145961.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1204e+08, grad_fn=<MseLossBackward>)
output :  tensor([[86204.5703]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3527e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196229.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(6.1891e+09, grad_fn=<MseLossBackward>)
output :  tensor([[81851.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(725251.8125, grad_fn=<MseLossBackward>)
output :  tensor([[137805.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2871065.5000, grad_fn=<MseLossBackward>)
output :  tensor([[78354.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(8147858., grad_fn=<MseLossBackward>)
output :  tensor([[143400.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(200326.1719, grad_fn=<MseLossBackward>)
output :  tensor([[171678.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(18674012., grad_fn=<MseLossBackward>)
output :  tensor([[151931.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(2460388.2500, grad_fn=<MseLossBackward>)
output :  tensor([[108152.6484]], grad_fn=<AddmmBackward>)
loss:  tensor(566479.6875, grad_fn=<MseLossBackward>)
output :  tensor([[204690.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2334e+10, grad_fn=<MseLossBackward>)
output :  tensor([[129646.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(1314516., grad_fn=<MseLossBackward>)
output :  tensor([[267812.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4853e+08, grad_fn=<MseLossBackward>)
output :  tensor([[307963.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(4146568.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110107.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(6797345., grad_fn=<MseLossBackward>)
output :  tensor([[170993.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(2270625.2500, grad_fn=<MseLossBackward>)
output :  tensor([[132627.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0651e+08, grad_fn=<MseLossBackward>)
output :  tensor([[140350.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1824103.5000, grad_fn=<MseLossBackward>)
output :  tensor([[132106.]], grad_fn=<AddmmBackward>)
loss:  tensor(3444736., grad_fn=<MseLossBackward>)
output :  tensor([[127965.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(8793217., grad_fn=<MseLossBackward>)
output :  tensor([[133676.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5.8451e+08, grad_fn=<MseLossBackward>)
output :  tensor([[225508.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9003e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190318.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2705e+10, grad_fn=<MseLossBackward>)
output :  tensor([[141163.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7486380., grad_fn=<MseLossBackward>)
output :  tensor([[129507.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(4028707.5000, grad_fn=<MseLossBackward>)
output :  tensor([[110314.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(875862., grad_fn=<MseLossBackward>)
output :  tensor([[254215.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0762e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133364.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(2673736., grad_fn=<MseLossBackward>)
output :  tensor([[196952.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(36575280., grad_fn=<MseLossBackward>)
output :  tensor([[110193.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(28024616., grad_fn=<MseLossBackward>)
output :  tensor([[140967.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(1035147.2500, grad_fn=<MseLossBackward>)
output :  tensor([[210972.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8300e+08, grad_fn=<MseLossBackward>)
output :  tensor([[182140.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(5018020., grad_fn=<MseLossBackward>)
output :  tensor([[186654.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2736543., grad_fn=<MseLossBackward>)
output :  tensor([[163973.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1033e+10, grad_fn=<MseLossBackward>)
output :  tensor([[304612.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2342e+08, grad_fn=<MseLossBackward>)
output :  tensor([[197516.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(147216.0938, grad_fn=<MseLossBackward>)
output :  tensor([[260090.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0383e+10, grad_fn=<MseLossBackward>)
output :  tensor([[222903.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8573e+09, grad_fn=<MseLossBackward>)
output :  tensor([[283622.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1141e+09, grad_fn=<MseLossBackward>)
output :  tensor([[222928.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1147375.7500, grad_fn=<MseLossBackward>)
output :  tensor([[223083.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8533e+10, grad_fn=<MseLossBackward>)
output :  tensor([[198841.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(3389396., grad_fn=<MseLossBackward>)
output :  tensor([[157031.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8579e+08, grad_fn=<MseLossBackward>)
output :  tensor([[130786.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(2937073., grad_fn=<MseLossBackward>)
output :  tensor([[133151.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(5513764.5000, grad_fn=<MseLossBackward>)
output :  tensor([[90810.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(35732.8125, grad_fn=<MseLossBackward>)
output :  tensor([[107728.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(73453.7031, grad_fn=<MseLossBackward>)
output :  tensor([[273328.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(3.0882e+09, grad_fn=<MseLossBackward>)
output :  tensor([[234397.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(362648.5938, grad_fn=<MseLossBackward>)
output :  tensor([[144471.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(279378.3125, grad_fn=<MseLossBackward>)
output :  tensor([[137799.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(89513.1562, grad_fn=<MseLossBackward>)
output :  tensor([[173785.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(2717.0156, grad_fn=<MseLossBackward>)
output :  tensor([[148472.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(10384808., grad_fn=<MseLossBackward>)
output :  tensor([[166873.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6320e+08, grad_fn=<MseLossBackward>)
output :  tensor([[164752.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(61132.5625, grad_fn=<MseLossBackward>)
output :  tensor([[136956.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1861.1135, grad_fn=<MseLossBackward>)
output :  tensor([[188557.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3636e+09, grad_fn=<MseLossBackward>)
output :  tensor([[111865.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(18134.4102, grad_fn=<MseLossBackward>)
output :  tensor([[161402.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1231e+08, grad_fn=<MseLossBackward>)
output :  tensor([[120240.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(57641.2578, grad_fn=<MseLossBackward>)
output :  tensor([[84395.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(6785618., grad_fn=<MseLossBackward>)
output :  tensor([[177757.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(5029927.5000, grad_fn=<MseLossBackward>)
output :  tensor([[109917.4453]], grad_fn=<AddmmBackward>)
loss:  tensor(304.3389, grad_fn=<MseLossBackward>)
output :  tensor([[239450.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(203274.1719, grad_fn=<MseLossBackward>)
output :  tensor([[246669.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2788221.5000, grad_fn=<MseLossBackward>)
output :  tensor([[125827.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(13484961., grad_fn=<MseLossBackward>)
output :  tensor([[112230.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(10704144., grad_fn=<MseLossBackward>)
output :  tensor([[289646.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1758e+10, grad_fn=<MseLossBackward>)
output :  tensor([[170839.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(436198.3438, grad_fn=<MseLossBackward>)
output :  tensor([[125081.1641]], grad_fn=<AddmmBackward>)
loss:  tensor(6587.6050, grad_fn=<MseLossBackward>)
output :  tensor([[144842.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2052e+08, grad_fn=<MseLossBackward>)
output :  tensor([[204285.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(94373032., grad_fn=<MseLossBackward>)
output :  tensor([[143019.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(4079958.2500, grad_fn=<MseLossBackward>)
output :  tensor([[159174.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4599e+10, grad_fn=<MseLossBackward>)
output :  tensor([[154006.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(11345.5781, grad_fn=<MseLossBackward>)
output :  tensor([[130676.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(1383894.8750, grad_fn=<MseLossBackward>)
output :  tensor([[252408.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5899e+10, grad_fn=<MseLossBackward>)
output :  tensor([[400125.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(3512227.5000, grad_fn=<MseLossBackward>)
output :  tensor([[105421.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(12807228., grad_fn=<MseLossBackward>)
output :  tensor([[116351.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4616321., grad_fn=<MseLossBackward>)
output :  tensor([[162249.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(7558633.5000, grad_fn=<MseLossBackward>)
output :  tensor([[128364.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5720e+08, grad_fn=<MseLossBackward>)
output :  tensor([[162910.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4915e+09, grad_fn=<MseLossBackward>)
output :  tensor([[172816.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(3.9459e+09, grad_fn=<MseLossBackward>)
output :  tensor([[105264.2734]], grad_fn=<AddmmBackward>)
loss:  tensor(2769806., grad_fn=<MseLossBackward>)
output :  tensor([[141491.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(241219.1094, grad_fn=<MseLossBackward>)
output :  tensor([[359132.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(66603452., grad_fn=<MseLossBackward>)
output :  tensor([[208216.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0961e+09, grad_fn=<MseLossBackward>)
output :  tensor([[176112.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(375385.9688, grad_fn=<MseLossBackward>)
output :  tensor([[200760.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(4576390.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141860.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(8184963.5000, grad_fn=<MseLossBackward>)
output :  tensor([[195681.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(1397013.2500, grad_fn=<MseLossBackward>)
output :  tensor([[133378.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6967e+08, grad_fn=<MseLossBackward>)
output :  tensor([[177774.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(10406068., grad_fn=<MseLossBackward>)
output :  tensor([[244164.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(4685804.5000, grad_fn=<MseLossBackward>)
output :  tensor([[172617.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1910442.2500, grad_fn=<MseLossBackward>)
output :  tensor([[107852.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(21793.1406, grad_fn=<MseLossBackward>)
output :  tensor([[264484.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(5842.6914, grad_fn=<MseLossBackward>)
output :  tensor([[247686.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(5353583.5000, grad_fn=<MseLossBackward>)
output :  tensor([[120704.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(5269750.5000, grad_fn=<MseLossBackward>)
output :  tensor([[217177.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3434e+09, grad_fn=<MseLossBackward>)
output :  tensor([[307230.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2650e+08, grad_fn=<MseLossBackward>)
output :  tensor([[206662.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(113958.9922, grad_fn=<MseLossBackward>)
output :  tensor([[214480.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5755e+10, grad_fn=<MseLossBackward>)
output :  tensor([[158917.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1035051.8750, grad_fn=<MseLossBackward>)
output :  tensor([[169729.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(67990.5625, grad_fn=<MseLossBackward>)
output :  tensor([[160599.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(13451015., grad_fn=<MseLossBackward>)
output :  tensor([[171187.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1409525.5000, grad_fn=<MseLossBackward>)
output :  tensor([[240757.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4216e+08, grad_fn=<MseLossBackward>)
output :  tensor([[228872.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(340837.0312, grad_fn=<MseLossBackward>)
output :  tensor([[160001.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6904e+08, grad_fn=<MseLossBackward>)
output :  tensor([[120329.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(7134199.5000, grad_fn=<MseLossBackward>)
output :  tensor([[177648.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(421018.5000, grad_fn=<MseLossBackward>)
output :  tensor([[180356.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(6.3431e+09, grad_fn=<MseLossBackward>)
output :  tensor([[210607.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.3860e+10, grad_fn=<MseLossBackward>)
output :  tensor([[136026.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2541633., grad_fn=<MseLossBackward>)
output :  tensor([[145019.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4846e+08, grad_fn=<MseLossBackward>)
output :  tensor([[277766.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(588001.4375, grad_fn=<MseLossBackward>)
output :  tensor([[89047.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(16384027., grad_fn=<MseLossBackward>)
output :  tensor([[237398.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(807976.2500, grad_fn=<MseLossBackward>)
output :  tensor([[261704.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0319e+11, grad_fn=<MseLossBackward>)
output :  tensor([[171750.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(3065453.7500, grad_fn=<MseLossBackward>)
output :  tensor([[195796.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5369e+09, grad_fn=<MseLossBackward>)
output :  tensor([[152837.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(4677622.5000, grad_fn=<MseLossBackward>)
output :  tensor([[206415.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0431e+09, grad_fn=<MseLossBackward>)
output :  tensor([[125647.4609]], grad_fn=<AddmmBackward>)
loss:  tensor(11239518., grad_fn=<MseLossBackward>)
output :  tensor([[148548.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(12591741., grad_fn=<MseLossBackward>)
output :  tensor([[169398.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2351e+08, grad_fn=<MseLossBackward>)
output :  tensor([[188744.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(8376502., grad_fn=<MseLossBackward>)
output :  tensor([[127590.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(2530386.2500, grad_fn=<MseLossBackward>)
output :  tensor([[139236.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(7488261., grad_fn=<MseLossBackward>)
output :  tensor([[175629.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(6913284., grad_fn=<MseLossBackward>)
output :  tensor([[196331.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8803e+09, grad_fn=<MseLossBackward>)
output :  tensor([[237524.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(29985036., grad_fn=<MseLossBackward>)
output :  tensor([[154408.]], grad_fn=<AddmmBackward>)
loss:  tensor(350464., grad_fn=<MseLossBackward>)
output :  tensor([[193909.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(4371823.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158325.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0523e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196388.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8523e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180696.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(633790.1250, grad_fn=<MseLossBackward>)
output :  tensor([[100706.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(13740980., grad_fn=<MseLossBackward>)
output :  tensor([[172617.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1531e+10, grad_fn=<MseLossBackward>)
output :  tensor([[135661.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(437354.8750, grad_fn=<MseLossBackward>)
output :  tensor([[118055.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(9335078., grad_fn=<MseLossBackward>)
output :  tensor([[171775.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4948330.5000, grad_fn=<MseLossBackward>)
output :  tensor([[88069.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(9423173., grad_fn=<MseLossBackward>)
output :  tensor([[298160.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(66594272., grad_fn=<MseLossBackward>)
output :  tensor([[163333.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2775868.5000, grad_fn=<MseLossBackward>)
output :  tensor([[193439.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9524e+10, grad_fn=<MseLossBackward>)
output :  tensor([[248899.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8841e+08, grad_fn=<MseLossBackward>)
output :  tensor([[148228.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7679220.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124668.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(446474.5312, grad_fn=<MseLossBackward>)
output :  tensor([[121424.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(2323314.2500, grad_fn=<MseLossBackward>)
output :  tensor([[143830.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3120e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175367.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(1870056.2500, grad_fn=<MseLossBackward>)
output :  tensor([[110157.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6491e+08, grad_fn=<MseLossBackward>)
output :  tensor([[212813.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1064e+10, grad_fn=<MseLossBackward>)
output :  tensor([[245398.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(15200130., grad_fn=<MseLossBackward>)
output :  tensor([[251865.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0543e+10, grad_fn=<MseLossBackward>)
output :  tensor([[221975.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8983e+08, grad_fn=<MseLossBackward>)
output :  tensor([[196715.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4110e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190233.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7472876.5000, grad_fn=<MseLossBackward>)
output :  tensor([[207042.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4.7449e+10, grad_fn=<MseLossBackward>)
output :  tensor([[190543.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1158e+10, grad_fn=<MseLossBackward>)
output :  tensor([[177920.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(670812.1875, grad_fn=<MseLossBackward>)
output :  tensor([[150118.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(3538690., grad_fn=<MseLossBackward>)
output :  tensor([[334344.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(7052676., grad_fn=<MseLossBackward>)
output :  tensor([[212659.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(435517.5000, grad_fn=<MseLossBackward>)
output :  tensor([[158177.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3321620.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188658.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7922e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109554.4141]], grad_fn=<AddmmBackward>)
loss:  tensor(20742688., grad_fn=<MseLossBackward>)
output :  tensor([[273502.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(7.9241e+10, grad_fn=<MseLossBackward>)
output :  tensor([[174294.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(155765.8906, grad_fn=<MseLossBackward>)
output :  tensor([[213077.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(178506.2500, grad_fn=<MseLossBackward>)
output :  tensor([[215137.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(34371472., grad_fn=<MseLossBackward>)
output :  tensor([[178721.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(229186.6094, grad_fn=<MseLossBackward>)
output :  tensor([[201754.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(2113.1260, grad_fn=<MseLossBackward>)
output :  tensor([[157824.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(7978683., grad_fn=<MseLossBackward>)
output :  tensor([[147886.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.2931e+09, grad_fn=<MseLossBackward>)
output :  tensor([[118263.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(55817.7539, grad_fn=<MseLossBackward>)
output :  tensor([[138743.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(1577889.2500, grad_fn=<MseLossBackward>)
output :  tensor([[147087.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(3656819.5000, grad_fn=<MseLossBackward>)
output :  tensor([[201841.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5916e+10, grad_fn=<MseLossBackward>)
output :  tensor([[160393.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(797476.9375, grad_fn=<MseLossBackward>)
output :  tensor([[99891.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(153174.3906, grad_fn=<MseLossBackward>)
output :  tensor([[226265.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8864e+08, grad_fn=<MseLossBackward>)
output :  tensor([[185074.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8316e+08, grad_fn=<MseLossBackward>)
output :  tensor([[174783.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(2896165.7500, grad_fn=<MseLossBackward>)
output :  tensor([[80888.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1236370.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129467.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(936237.6875, grad_fn=<MseLossBackward>)
output :  tensor([[214072.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(5269.8525, grad_fn=<MseLossBackward>)
output :  tensor([[143075.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(855422.6875, grad_fn=<MseLossBackward>)
output :  tensor([[131421.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2019951.5000, grad_fn=<MseLossBackward>)
output :  tensor([[141998.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(362046.6562, grad_fn=<MseLossBackward>)
output :  tensor([[174617.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3777e+09, grad_fn=<MseLossBackward>)
output :  tensor([[144776.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(603243.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160763.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(582312.0625, grad_fn=<MseLossBackward>)
output :  tensor([[216129.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(1275170.2500, grad_fn=<MseLossBackward>)
output :  tensor([[134054.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(8.4419e+08, grad_fn=<MseLossBackward>)
output :  tensor([[253871.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1272877.5000, grad_fn=<MseLossBackward>)
output :  tensor([[155839.3906]], grad_fn=<AddmmBackward>)
loss:  tensor(13400061., grad_fn=<MseLossBackward>)
output :  tensor([[131400.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(8412175., grad_fn=<MseLossBackward>)
output :  tensor([[95383.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(146892.5469, grad_fn=<MseLossBackward>)
output :  tensor([[151993.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5554e+09, grad_fn=<MseLossBackward>)
output :  tensor([[178285.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(2606055.2500, grad_fn=<MseLossBackward>)
output :  tensor([[118947.2109]], grad_fn=<AddmmBackward>)
loss:  tensor(2411153.7500, grad_fn=<MseLossBackward>)
output :  tensor([[189204.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5797e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145089.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(4.3020e+09, grad_fn=<MseLossBackward>)
output :  tensor([[151521.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(2630580., grad_fn=<MseLossBackward>)
output :  tensor([[187213.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(288318.6562, grad_fn=<MseLossBackward>)
output :  tensor([[254291.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5043e+09, grad_fn=<MseLossBackward>)
output :  tensor([[89147.3047]], grad_fn=<AddmmBackward>)
loss:  tensor(5535175., grad_fn=<MseLossBackward>)
output :  tensor([[237076.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(8547949., grad_fn=<MseLossBackward>)
output :  tensor([[130432.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(3735009.2500, grad_fn=<MseLossBackward>)
output :  tensor([[165842.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0011e+10, grad_fn=<MseLossBackward>)
output :  tensor([[114667.8828]], grad_fn=<AddmmBackward>)
loss:  tensor(2.1515e+08, grad_fn=<MseLossBackward>)
output :  tensor([[178453.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6020045.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162955.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5486e+08, grad_fn=<MseLossBackward>)
output :  tensor([[153468.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(5.2756e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235935.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(9392309., grad_fn=<MseLossBackward>)
output :  tensor([[223019.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2236e+09, grad_fn=<MseLossBackward>)
output :  tensor([[125278.3828]], grad_fn=<AddmmBackward>)
loss:  tensor(2963965.7500, grad_fn=<MseLossBackward>)
output :  tensor([[126053.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(2870.6155, grad_fn=<MseLossBackward>)
output :  tensor([[224857.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(4589168., grad_fn=<MseLossBackward>)
output :  tensor([[229903.]], grad_fn=<AddmmBackward>)
loss:  tensor(16785408., grad_fn=<MseLossBackward>)
output :  tensor([[228004.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(1702494.8750, grad_fn=<MseLossBackward>)
output :  tensor([[145349.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(7026724., grad_fn=<MseLossBackward>)
output :  tensor([[207862.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(4569106.5000, grad_fn=<MseLossBackward>)
output :  tensor([[126128.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(37557364., grad_fn=<MseLossBackward>)
output :  tensor([[135319.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(7950109., grad_fn=<MseLossBackward>)
output :  tensor([[312296.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(7307560.5000, grad_fn=<MseLossBackward>)
output :  tensor([[143234.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(4993199.5000, grad_fn=<MseLossBackward>)
output :  tensor([[119600.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7669e+09, grad_fn=<MseLossBackward>)
output :  tensor([[109034.0312]], grad_fn=<AddmmBackward>)
loss:  tensor(217126.8750, grad_fn=<MseLossBackward>)
output :  tensor([[159060.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8063e+08, grad_fn=<MseLossBackward>)
output :  tensor([[183604.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(8.3030e+09, grad_fn=<MseLossBackward>)
output :  tensor([[168825.4531]], grad_fn=<AddmmBackward>)
loss:  tensor(17426842., grad_fn=<MseLossBackward>)
output :  tensor([[197317.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(13562302., grad_fn=<MseLossBackward>)
output :  tensor([[106645.2031]], grad_fn=<AddmmBackward>)
loss:  tensor(44158724., grad_fn=<MseLossBackward>)
output :  tensor([[181488.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(6190610.5000, grad_fn=<MseLossBackward>)
output :  tensor([[166462.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(2067035.2500, grad_fn=<MseLossBackward>)
output :  tensor([[140487.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2213586., grad_fn=<MseLossBackward>)
output :  tensor([[262917.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2511e+09, grad_fn=<MseLossBackward>)
output :  tensor([[143737.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3.4501e+09, grad_fn=<MseLossBackward>)
output :  tensor([[173008.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(73.5842, grad_fn=<MseLossBackward>)
output :  tensor([[144306.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(18549710., grad_fn=<MseLossBackward>)
output :  tensor([[202297.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(3232747.7500, grad_fn=<MseLossBackward>)
output :  tensor([[169559.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(193888.8594, grad_fn=<MseLossBackward>)
output :  tensor([[241849.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(4625456.5000, grad_fn=<MseLossBackward>)
output :  tensor([[135314.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(663053.9375, grad_fn=<MseLossBackward>)
output :  tensor([[151522.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(4718806., grad_fn=<MseLossBackward>)
output :  tensor([[215584.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(341932.5625, grad_fn=<MseLossBackward>)
output :  tensor([[161150.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(14817327., grad_fn=<MseLossBackward>)
output :  tensor([[191024.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(4100372., grad_fn=<MseLossBackward>)
output :  tensor([[132058.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(7.2583e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128119.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(775995.8125, grad_fn=<MseLossBackward>)
output :  tensor([[140754.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(569600.3750, grad_fn=<MseLossBackward>)
output :  tensor([[207219.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8789e+09, grad_fn=<MseLossBackward>)
output :  tensor([[167947.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8034e+09, grad_fn=<MseLossBackward>)
output :  tensor([[72253.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5016e+08, grad_fn=<MseLossBackward>)
output :  tensor([[95086.1953]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1207e+08, grad_fn=<MseLossBackward>)
output :  tensor([[259426.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(37619824., grad_fn=<MseLossBackward>)
output :  tensor([[202815.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.0725e+09, grad_fn=<MseLossBackward>)
output :  tensor([[115311.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(97080.9297, grad_fn=<MseLossBackward>)
output :  tensor([[159923.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(7.6048e+08, grad_fn=<MseLossBackward>)
output :  tensor([[212476.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(56608224., grad_fn=<MseLossBackward>)
output :  tensor([[182973.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5736e+09, grad_fn=<MseLossBackward>)
output :  tensor([[159790.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(22951136., grad_fn=<MseLossBackward>)
output :  tensor([[170029.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(857.3916, grad_fn=<MseLossBackward>)
output :  tensor([[112487.8516]], grad_fn=<AddmmBackward>)
loss:  tensor(6310890., grad_fn=<MseLossBackward>)
output :  tensor([[158409.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(11627141., grad_fn=<MseLossBackward>)
output :  tensor([[193216.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8723e+08, grad_fn=<MseLossBackward>)
output :  tensor([[216391.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(9662092., grad_fn=<MseLossBackward>)
output :  tensor([[245628.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2.4937e+11, grad_fn=<MseLossBackward>)
output :  tensor([[145331.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2782589., grad_fn=<MseLossBackward>)
output :  tensor([[111045.4297]], grad_fn=<AddmmBackward>)
loss:  tensor(6581429.5000, grad_fn=<MseLossBackward>)
output :  tensor([[170711.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2519e+08, grad_fn=<MseLossBackward>)
output :  tensor([[145419.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(25809734., grad_fn=<MseLossBackward>)
output :  tensor([[235162.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3375430.2500, grad_fn=<MseLossBackward>)
output :  tensor([[116861.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(3465182.2500, grad_fn=<MseLossBackward>)
output :  tensor([[176683.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(38641764., grad_fn=<MseLossBackward>)
output :  tensor([[185740.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(920580.3125, grad_fn=<MseLossBackward>)
output :  tensor([[165515.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(2.3865e+10, grad_fn=<MseLossBackward>)
output :  tensor([[95452.9922]], grad_fn=<AddmmBackward>)
loss:  tensor(2.0889e+08, grad_fn=<MseLossBackward>)
output :  tensor([[235639.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(11296006., grad_fn=<MseLossBackward>)
output :  tensor([[178679.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(7180976.5000, grad_fn=<MseLossBackward>)
output :  tensor([[139496.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(253512.2500, grad_fn=<MseLossBackward>)
output :  tensor([[233945.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1112233.8750, grad_fn=<MseLossBackward>)
output :  tensor([[163278.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(77788.6953, grad_fn=<MseLossBackward>)
output :  tensor([[207598.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3783e+10, grad_fn=<MseLossBackward>)
output :  tensor([[133475.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(2324910.2500, grad_fn=<MseLossBackward>)
output :  tensor([[188299.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(6.9168e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133057.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(8656651., grad_fn=<MseLossBackward>)
output :  tensor([[225483.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1059e+08, grad_fn=<MseLossBackward>)
output :  tensor([[226592.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4792e+08, grad_fn=<MseLossBackward>)
output :  tensor([[92235.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4995784., grad_fn=<MseLossBackward>)
output :  tensor([[158162.0156]], grad_fn=<AddmmBackward>)
loss:  tensor(1617944.2500, grad_fn=<MseLossBackward>)
output :  tensor([[249937.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(1.4627e+10, grad_fn=<MseLossBackward>)
output :  tensor([[144365.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(402550.5938, grad_fn=<MseLossBackward>)
output :  tensor([[108921.6641]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7574e+09, grad_fn=<MseLossBackward>)
output :  tensor([[169928.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(29471496., grad_fn=<MseLossBackward>)
output :  tensor([[143720.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(78277.5469, grad_fn=<MseLossBackward>)
output :  tensor([[129073.9453]], grad_fn=<AddmmBackward>)
loss:  tensor(763780.4375, grad_fn=<MseLossBackward>)
output :  tensor([[189145.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(4.8797e+09, grad_fn=<MseLossBackward>)
output :  tensor([[123939.0859]], grad_fn=<AddmmBackward>)
loss:  tensor(2070968.3750, grad_fn=<MseLossBackward>)
output :  tensor([[149488.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(6306847.5000, grad_fn=<MseLossBackward>)
output :  tensor([[168887.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(8191312.5000, grad_fn=<MseLossBackward>)
output :  tensor([[148621.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(5656296., grad_fn=<MseLossBackward>)
output :  tensor([[157676.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(27282014., grad_fn=<MseLossBackward>)
output :  tensor([[136543.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(7.5864e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133976.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(3904884.7500, grad_fn=<MseLossBackward>)
output :  tensor([[156165.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(2.9466e+08, grad_fn=<MseLossBackward>)
output :  tensor([[146522.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(5617640.5000, grad_fn=<MseLossBackward>)
output :  tensor([[162848.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1206427.6250, grad_fn=<MseLossBackward>)
output :  tensor([[133344.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(5.4964e+08, grad_fn=<MseLossBackward>)
output :  tensor([[149758.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(917883.7500, grad_fn=<MseLossBackward>)
output :  tensor([[184280.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(13834796., grad_fn=<MseLossBackward>)
output :  tensor([[171280.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(5202747., grad_fn=<MseLossBackward>)
output :  tensor([[180843.2344]], grad_fn=<AddmmBackward>)
loss:  tensor(711044.1875, grad_fn=<MseLossBackward>)
output :  tensor([[219394.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(366441.0625, grad_fn=<MseLossBackward>)
output :  tensor([[107809.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(8138.0132, grad_fn=<MseLossBackward>)
output :  tensor([[133105.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(67331512., grad_fn=<MseLossBackward>)
output :  tensor([[285457.]], grad_fn=<AddmmBackward>)
loss:  tensor(294849., grad_fn=<MseLossBackward>)
output :  tensor([[119324.9297]], grad_fn=<AddmmBackward>)
loss:  tensor(11055157., grad_fn=<MseLossBackward>)
output :  tensor([[177788.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7818e+09, grad_fn=<MseLossBackward>)
output :  tensor([[185419.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(176229.4219, grad_fn=<MseLossBackward>)
output :  tensor([[195229.7344]], grad_fn=<AddmmBackward>)
loss:  tensor(94667728., grad_fn=<MseLossBackward>)
output :  tensor([[251876.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(5.3468e+08, grad_fn=<MseLossBackward>)
output :  tensor([[221317.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(465998.2188, grad_fn=<MseLossBackward>)
output :  tensor([[119809.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9346e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173403.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(4.1630e+08, grad_fn=<MseLossBackward>)
output :  tensor([[125496.9609]], grad_fn=<AddmmBackward>)
loss:  tensor(2240892., grad_fn=<MseLossBackward>)
output :  tensor([[183126.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.5359e+10, grad_fn=<MseLossBackward>)
output :  tensor([[154072.8438]], grad_fn=<AddmmBackward>)
loss:  tensor(1150993.7500, grad_fn=<MseLossBackward>)
output :  tensor([[151996.1094]], grad_fn=<AddmmBackward>)
loss:  tensor(30207218., grad_fn=<MseLossBackward>)
output :  tensor([[207721.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(2021773., grad_fn=<MseLossBackward>)
output :  tensor([[145275.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6321e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175048.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(905233.3125, grad_fn=<MseLossBackward>)
output :  tensor([[255945.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5483e+08, grad_fn=<MseLossBackward>)
output :  tensor([[147475.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(275034.6875, grad_fn=<MseLossBackward>)
output :  tensor([[202137.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(278256.2500, grad_fn=<MseLossBackward>)
output :  tensor([[162993.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(9262987., grad_fn=<MseLossBackward>)
output :  tensor([[120739.9375]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0719e+09, grad_fn=<MseLossBackward>)
output :  tensor([[133883.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(3485339., grad_fn=<MseLossBackward>)
output :  tensor([[181344.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(7049771.5000, grad_fn=<MseLossBackward>)
output :  tensor([[200181.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0366e+08, grad_fn=<MseLossBackward>)
output :  tensor([[236722.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7329e+09, grad_fn=<MseLossBackward>)
output :  tensor([[254801.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(4831616., grad_fn=<MseLossBackward>)
output :  tensor([[190518.1406]], grad_fn=<AddmmBackward>)
loss:  tensor(1.6508e+10, grad_fn=<MseLossBackward>)
output :  tensor([[143973.9531]], grad_fn=<AddmmBackward>)
loss:  tensor(2.7535e+09, grad_fn=<MseLossBackward>)
output :  tensor([[145028.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(279378.3125, grad_fn=<MseLossBackward>)
output :  tensor([[70422.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(9.2554e+08, grad_fn=<MseLossBackward>)
output :  tensor([[128279.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(45162600., grad_fn=<MseLossBackward>)
output :  tensor([[129905.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(1011988.8750, grad_fn=<MseLossBackward>)
output :  tensor([[151425.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6630383.5000, grad_fn=<MseLossBackward>)
output :  tensor([[124009.5469]], grad_fn=<AddmmBackward>)
loss:  tensor(8942810., grad_fn=<MseLossBackward>)
output :  tensor([[76325.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(30570.3359, grad_fn=<MseLossBackward>)
output :  tensor([[84581.0078]], grad_fn=<AddmmBackward>)
loss:  tensor(6661601.5000, grad_fn=<MseLossBackward>)
output :  tensor([[224197.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(60886076., grad_fn=<MseLossBackward>)
output :  tensor([[138313.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6631e+08, grad_fn=<MseLossBackward>)
output :  tensor([[133994.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(12211093., grad_fn=<MseLossBackward>)
output :  tensor([[168277.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1630888.6250, grad_fn=<MseLossBackward>)
output :  tensor([[235982.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(965244.8750, grad_fn=<MseLossBackward>)
output :  tensor([[188531.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(13022738., grad_fn=<MseLossBackward>)
output :  tensor([[156872.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(760820.0625, grad_fn=<MseLossBackward>)
output :  tensor([[199461.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(2439160.7500, grad_fn=<MseLossBackward>)
output :  tensor([[208198.5000]], grad_fn=<AddmmBackward>)
loss:  tensor(8.2953e+08, grad_fn=<MseLossBackward>)
output :  tensor([[137082.5938]], grad_fn=<AddmmBackward>)
loss:  tensor(6821.7275, grad_fn=<MseLossBackward>)
output :  tensor([[155573.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(328579.7500, grad_fn=<MseLossBackward>)
output :  tensor([[136365.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(133635.9375, grad_fn=<MseLossBackward>)
output :  tensor([[203529.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7.0071e+08, grad_fn=<MseLossBackward>)
output :  tensor([[154076.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(5890.5625, grad_fn=<MseLossBackward>)
output :  tensor([[135050.5156]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7264e+09, grad_fn=<MseLossBackward>)
output :  tensor([[146494.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(2541533.5000, grad_fn=<MseLossBackward>)
output :  tensor([[207356.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(21561512., grad_fn=<MseLossBackward>)
output :  tensor([[99004.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2.8915e+08, grad_fn=<MseLossBackward>)
output :  tensor([[165347.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(4633323.5000, grad_fn=<MseLossBackward>)
output :  tensor([[129933.5234]], grad_fn=<AddmmBackward>)
loss:  tensor(3738513., grad_fn=<MseLossBackward>)
output :  tensor([[148011.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1022310.5625, grad_fn=<MseLossBackward>)
output :  tensor([[104305.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(1.7575e+09, grad_fn=<MseLossBackward>)
output :  tensor([[141274.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(14244020., grad_fn=<MseLossBackward>)
output :  tensor([[235297.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(493681.8750, grad_fn=<MseLossBackward>)
output :  tensor([[148022.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(9132767., grad_fn=<MseLossBackward>)
output :  tensor([[139686.0781]], grad_fn=<AddmmBackward>)
loss:  tensor(4778937.5000, grad_fn=<MseLossBackward>)
output :  tensor([[161760.7500]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1398e+09, grad_fn=<MseLossBackward>)
output :  tensor([[272287.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(32630872., grad_fn=<MseLossBackward>)
output :  tensor([[174245.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(569553.2500, grad_fn=<MseLossBackward>)
output :  tensor([[104357.1797]], grad_fn=<AddmmBackward>)
loss:  tensor(2500129.2500, grad_fn=<MseLossBackward>)
output :  tensor([[202907.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(5.5640e+09, grad_fn=<MseLossBackward>)
output :  tensor([[162952.9688]], grad_fn=<AddmmBackward>)
loss:  tensor(15625962., grad_fn=<MseLossBackward>)
output :  tensor([[163650.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(4.5700e+10, grad_fn=<MseLossBackward>)
output :  tensor([[99525.0703]], grad_fn=<AddmmBackward>)
loss:  tensor(1500797.2500, grad_fn=<MseLossBackward>)
output :  tensor([[124354.3359]], grad_fn=<AddmmBackward>)
loss:  tensor(569022.6875, grad_fn=<MseLossBackward>)
output :  tensor([[157698.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(2885964., grad_fn=<MseLossBackward>)
output :  tensor([[141137.4844]], grad_fn=<AddmmBackward>)
loss:  tensor(1293870.7500, grad_fn=<MseLossBackward>)
output :  tensor([[200888.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(789099.1250, grad_fn=<MseLossBackward>)
output :  tensor([[143388.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(1929060.6250, grad_fn=<MseLossBackward>)
output :  tensor([[261195.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(1175733.6250, grad_fn=<MseLossBackward>)
output :  tensor([[127340.7109]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1793e+09, grad_fn=<MseLossBackward>)
output :  tensor([[163409.5312]], grad_fn=<AddmmBackward>)
loss:  tensor(4370059.5000, grad_fn=<MseLossBackward>)
output :  tensor([[190923.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(5871762., grad_fn=<MseLossBackward>)
output :  tensor([[123544.1328]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8344e+08, grad_fn=<MseLossBackward>)
output :  tensor([[256802.2656]], grad_fn=<AddmmBackward>)
loss:  tensor(46270816., grad_fn=<MseLossBackward>)
output :  tensor([[159740.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(7.4309e+08, grad_fn=<MseLossBackward>)
output :  tensor([[243824.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(2328199.2500, grad_fn=<MseLossBackward>)
output :  tensor([[141125.6406]], grad_fn=<AddmmBackward>)
loss:  tensor(8261942., grad_fn=<MseLossBackward>)
output :  tensor([[210172.8750]], grad_fn=<AddmmBackward>)
loss:  tensor(29885.7656, grad_fn=<MseLossBackward>)
output :  tensor([[174791.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(5721290.5000, grad_fn=<MseLossBackward>)
output :  tensor([[154673.6094]], grad_fn=<AddmmBackward>)
loss:  tensor(453749.5938, grad_fn=<MseLossBackward>)
output :  tensor([[118974.7266]], grad_fn=<AddmmBackward>)
loss:  tensor(950091.8750, grad_fn=<MseLossBackward>)
output :  tensor([[242796.3281]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9619e+09, grad_fn=<MseLossBackward>)
output :  tensor([[238098.3125]], grad_fn=<AddmmBackward>)
loss:  tensor(3616415.2500, grad_fn=<MseLossBackward>)
output :  tensor([[151541.6875]], grad_fn=<AddmmBackward>)
loss:  tensor(3223147., grad_fn=<MseLossBackward>)
output :  tensor([[254560.9844]], grad_fn=<AddmmBackward>)
loss:  tensor(114931.5938, grad_fn=<MseLossBackward>)
output :  tensor([[124996.2422]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1009e+08, grad_fn=<MseLossBackward>)
output :  tensor([[175799.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(40056.2695, grad_fn=<MseLossBackward>)
output :  tensor([[162137.4375]], grad_fn=<AddmmBackward>)
loss:  tensor(4568639., grad_fn=<MseLossBackward>)
output :  tensor([[126309.5859]], grad_fn=<AddmmBackward>)
loss:  tensor(21999984., grad_fn=<MseLossBackward>)
output :  tensor([[191612.6562]], grad_fn=<AddmmBackward>)
loss:  tensor(3.8580e+09, grad_fn=<MseLossBackward>)
output :  tensor([[166341.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(5480500.5000, grad_fn=<MseLossBackward>)
output :  tensor([[163219.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(47988.3789, grad_fn=<MseLossBackward>)
output :  tensor([[155811.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(4787686., grad_fn=<MseLossBackward>)
output :  tensor([[150414.]], grad_fn=<AddmmBackward>)
loss:  tensor(264196., grad_fn=<MseLossBackward>)
output :  tensor([[170841.7656]], grad_fn=<AddmmBackward>)
loss:  tensor(3.7628e+09, grad_fn=<MseLossBackward>)
output :  tensor([[164463.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(19919764., grad_fn=<MseLossBackward>)
output :  tensor([[379548.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(19552702., grad_fn=<MseLossBackward>)
output :  tensor([[133882.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(47372676., grad_fn=<MseLossBackward>)
output :  tensor([[129818.8125]], grad_fn=<AddmmBackward>)
loss:  tensor(1.9642e+09, grad_fn=<MseLossBackward>)
output :  tensor([[279273.3438]], grad_fn=<AddmmBackward>)
loss:  tensor(3762266.2500, grad_fn=<MseLossBackward>)
output :  tensor([[160052.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(3791113.2500, grad_fn=<MseLossBackward>)
output :  tensor([[129220.9766]], grad_fn=<AddmmBackward>)
loss:  tensor(76055432., grad_fn=<MseLossBackward>)
output :  tensor([[234072.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(4293702., grad_fn=<MseLossBackward>)
output :  tensor([[180458.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(1698.9854, grad_fn=<MseLossBackward>)
output :  tensor([[150676.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(1752520.8750, grad_fn=<MseLossBackward>)
output :  tensor([[145262.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(68857.0391, grad_fn=<MseLossBackward>)
output :  tensor([[154879.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(3.2325e+08, grad_fn=<MseLossBackward>)
output :  tensor([[101368.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(1873861.5000, grad_fn=<MseLossBackward>)
output :  tensor([[70065.6719]], grad_fn=<AddmmBackward>)
loss:  tensor(1.0132e+08, grad_fn=<MseLossBackward>)
output :  tensor([[163693.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(1706738.1250, grad_fn=<MseLossBackward>)
output :  tensor([[191806.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.3100e+09, grad_fn=<MseLossBackward>)
output :  tensor([[160835.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(8037756.5000, grad_fn=<MseLossBackward>)
output :  tensor([[160687.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(10161451., grad_fn=<MseLossBackward>)
output :  tensor([[140572.4062]], grad_fn=<AddmmBackward>)
loss:  tensor(9749421., grad_fn=<MseLossBackward>)
output :  tensor([[201644.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(18534236., grad_fn=<MseLossBackward>)
output :  tensor([[141587.]], grad_fn=<AddmmBackward>)
loss:  tensor(12866569., grad_fn=<MseLossBackward>)
output :  tensor([[184054.1250]], grad_fn=<AddmmBackward>)
loss:  tensor(1.5862e+10, grad_fn=<MseLossBackward>)
output :  tensor([[148022.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(4091328., grad_fn=<MseLossBackward>)
output :  tensor([[107931.6172]], grad_fn=<AddmmBackward>)
loss:  tensor(6.2159e+08, grad_fn=<MseLossBackward>)
output :  tensor([[93522.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(228140.5625, grad_fn=<MseLossBackward>)
output :  tensor([[175709.7812]], grad_fn=<AddmmBackward>)
loss:  tensor(503789.4375, grad_fn=<MseLossBackward>)
output :  tensor([[255412.4219]], grad_fn=<AddmmBackward>)
loss:  tensor(24875936., grad_fn=<MseLossBackward>)
output :  tensor([[140031.9219]], grad_fn=<AddmmBackward>)
loss:  tensor(2155253.5000, grad_fn=<MseLossBackward>)
output :  tensor([[159021.5625]], grad_fn=<AddmmBackward>)
loss:  tensor(762893.0625, grad_fn=<MseLossBackward>)
output :  tensor([[134217.1719]], grad_fn=<AddmmBackward>)
loss:  tensor(2948679.2500, grad_fn=<MseLossBackward>)
output :  tensor([[147253.7969]], grad_fn=<AddmmBackward>)
loss:  tensor(5045428.5000, grad_fn=<MseLossBackward>)
output :  tensor([[165085.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(7923697., grad_fn=<MseLossBackward>)
output :  tensor([[128258.1875]], grad_fn=<AddmmBackward>)
loss:  tensor(1583035.7500, grad_fn=<MseLossBackward>)
output :  tensor([[170866.7188]], grad_fn=<AddmmBackward>)
loss:  tensor(6.6909e+08, grad_fn=<MseLossBackward>)
output :  tensor([[158241.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(1541011.8750, grad_fn=<MseLossBackward>)
output :  tensor([[114183.8203]], grad_fn=<AddmmBackward>)
loss:  tensor(5364688.5000, grad_fn=<MseLossBackward>)
output :  tensor([[157269.]], grad_fn=<AddmmBackward>)
loss:  tensor(5.7352e+09, grad_fn=<MseLossBackward>)
output :  tensor([[53766.1211]], grad_fn=<AddmmBackward>)
loss:  tensor(3119183.7500, grad_fn=<MseLossBackward>)
output :  tensor([[234429.5781]], grad_fn=<AddmmBackward>)
loss:  tensor(6.0950e+09, grad_fn=<MseLossBackward>)
output :  tensor([[198271.3594]], grad_fn=<AddmmBackward>)
loss:  tensor(7445479.5000, grad_fn=<MseLossBackward>)
output :  tensor([[182785.3750]], grad_fn=<AddmmBackward>)
loss:  tensor(4904564., grad_fn=<MseLossBackward>)
output :  tensor([[105210.0469]], grad_fn=<AddmmBackward>)
loss:  tensor(624025.9375, grad_fn=<MseLossBackward>)
output :  tensor([[86500.3516]], grad_fn=<AddmmBackward>)
loss:  tensor(249648.5625, grad_fn=<MseLossBackward>)
output :  tensor([[139443.2188]], grad_fn=<AddmmBackward>)
loss:  tensor(310005.3750, grad_fn=<MseLossBackward>)
output :  tensor([[223456.8594]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9763e+09, grad_fn=<MseLossBackward>)
output :  tensor([[207054.9062]], grad_fn=<AddmmBackward>)
loss:  tensor(198108.4531, grad_fn=<MseLossBackward>)
output :  tensor([[166910.7031]], grad_fn=<AddmmBackward>)
loss:  tensor(3650786.5000, grad_fn=<MseLossBackward>)
output :  tensor([[176361.8281]], grad_fn=<AddmmBackward>)
loss:  tensor(7.8567e+09, grad_fn=<MseLossBackward>)
output :  tensor([[188478.4688]], grad_fn=<AddmmBackward>)
loss:  tensor(2315057.2500, grad_fn=<MseLossBackward>)
output :  tensor([[86873.1016]], grad_fn=<AddmmBackward>)
loss:  tensor(16103.2139, grad_fn=<MseLossBackward>)
output :  tensor([[137717.8906]], grad_fn=<AddmmBackward>)
loss:  tensor(5208023., grad_fn=<MseLossBackward>)
output :  tensor([[110730.7891]], grad_fn=<AddmmBackward>)
loss:  tensor(53263.5898, grad_fn=<MseLossBackward>)
output :  tensor([[147095.0625]], grad_fn=<AddmmBackward>)
loss:  tensor(1.2399e+08, grad_fn=<MseLossBackward>)
output :  tensor([[173457.1562]], grad_fn=<AddmmBackward>)
loss:  tensor(1.8026e+09, grad_fn=<MseLossBackward>)
output :  tensor([[194342.2969]], grad_fn=<AddmmBackward>)
loss:  tensor(1.1359e+08, grad_fn=<MseLossBackward>)
output :  tensor([[180634.6250]], grad_fn=<AddmmBackward>)
loss:  tensor(402748.8750, grad_fn=<MseLossBackward>)
output :  tensor([[95846.7422]], grad_fn=<AddmmBackward>)
loss:  tensor(426745.7812, grad_fn=<MseLossBackward>)
output :  tensor([[118497.3984]], grad_fn=<AddmmBackward>)
loss:  tensor(994803.6250, grad_fn=<MseLossBackward>)
output :  tensor([[161806.2500]], grad_fn=<AddmmBackward>)
loss:  tensor(4.9256e+08, grad_fn=<MseLossBackward>)
output :  tensor([[201246.2812]], grad_fn=<AddmmBackward>)
loss:  tensor(1553217., grad_fn=<MseLossBackward>)
output :  tensor([[145099.0938]], grad_fn=<AddmmBackward>)
loss:  tensor(1208007.1250, grad_fn=<MseLossBackward>)
train_loss: [2.5573217e+09]
Out[113]:
2532927200.0
In [132]:
#test the model
# Evaluate the trained network on the held-out test set and report RMSE.
# Inference only: torch.no_grad() stops autograd from building a computation
# graph for the forward pass, which saves memory and time.
with torch.no_grad():
    ann_pred1 = model(torch.tensor(test_x.values).float())
# .detach() is kept so this line also works if ann_pred1 is recomputed elsewhere with grad enabled.
print(mean_squared_error(test_y, ann_pred1.detach().numpy())**0.5) #rmse
99176.32901765831

3.5 model 5 - ANN(5-layers)

In [136]:
import torch
import torch.nn as nn
import torch.nn.functional as F

class MultOutRegressor2(nn.Module):
    """Fully connected regression network built from five linear layers.

    Four hidden ``Linear -> ReLU`` stages of width ``hidden_dim`` feed a final
    linear layer of width ``target_dim``; the output has no activation.

    Args:
        input_dim: Number of input features per sample.
        target_dim: Number of regression outputs per sample.
        hidden_dim: Width of every hidden layer.
        seed: Passed to ``torch.manual_seed`` before the layers are created so
            the initial weights are reproducible. This reseeds PyTorch's
            global RNG as a side effect.
    """

    def __init__(self, input_dim, target_dim, hidden_dim=32, seed=1234):
        super().__init__()
        torch.manual_seed(seed)
        self.hidden_dim = hidden_dim
        self.target_dim = target_dim

        # Creation order (fc1 .. fc5) matters: together with the seed above it
        # determines the initial weights of every layer.
        width = self.hidden_dim
        self.fc1 = nn.Linear(input_dim, width)
        self.fc2 = nn.Linear(width, width)
        self.fc3 = nn.Linear(width, width)
        self.fc4 = nn.Linear(width, width)
        self.fc5 = nn.Linear(width, self.target_dim)

    def forward(self, x):
        """Apply the four ReLU-activated hidden layers, then the linear output layer."""
        for hidden_layer in (self.fc1, self.fc2, self.fc3, self.fc4):
            x = F.relu(hidden_layer(x))
        return self.fc5(x)
In [137]:
from torch import optim
from IPython import display

# Build the data pipeline, model, optimizer and loss for the 5-layer ANN.

#convert dataframe to array for DataLoader 
numpy_x = train_x.to_numpy()
numpy_y = train_y.to_numpy()

tabulardataset = TabularDataSet(numpy_x,numpy_y) 
# DataLoader is left at its defaults (batch_size=1, shuffle=False), so every
# optimizer step sees a single sample, in the same order each epoch.
train_dl = DataLoader(tabulardataset) 
# Take the input width from the data instead of hard-coding the column count,
# so the model still matches train_x if the feature set changes.
model2 = MultOutRegressor2(numpy_x.shape[1], 1)
# lr=0.001 is also AdamW's library default learning rate.
optimizer = optim.AdamW(model2.parameters(), lr=0.001)
criterion = nn.MSELoss()
In [138]:
#train the model
# Calls the notebook's `train` helper (defined in an earlier cell, not shown here)
# on model2 with the loader, loss and optimizer built above. The call is the
# last expression of the cell, so its return value is displayed as the cell output.
# NOTE(review): the first argument (500) is the epoch count according to the
# trailing comment; the exact meaning of log_interval=50 depends on `train` -- confirm there.
# The "min_loss" figure in the trailing comment was noted by the author from an earlier run.
train(500, train_dl ,model2, criterion , optimizer,log_interval=50) #default n_epochs = 500 : min_loss = 481092860
epoch_result tensor([0.])
C:\Users\KIM\anaconda3\lib\site-packages\torch\nn\modules\loss.py:528: UserWarning: Using a target size (torch.Size([1])) that is different to the input size (torch.Size([1, 1])). This will likely lead to incorrect results due to broadcasting. Please ensure they have the same size.
  return F.mse_loss(input, target, reduction=self.reduction)
train_loss: [4.9113827e+08]
epoch_result tensor([0.])
train_loss: [5.0928346e+08]
epoch_result tensor([0.])
train_loss: [4.8858035e+08]
epoch_result tensor([0.])
train_loss: [5.054563e+08]
epoch_result tensor([0.])
train_loss: [4.642146e+08]
epoch_result tensor([0.])
train_loss: [4.9271334e+08]
epoch_result tensor([0.])
train_loss: [4.5723866e+08]
epoch_result tensor([0.])
train_loss: [4.9392486e+08]
epoch_result tensor([0.])
train_loss: [4.8612915e+08]
epoch_result tensor([0.])
train_loss: [4.97068e+08]
epoch_result tensor([0.])
train_loss: [4.78047e+08]
epoch_result tensor([0.])
train_loss: [4.8552918e+08]
epoch_result tensor([0.])
train_loss: [4.7697274e+08]
epoch_result tensor([0.])
train_loss: [5.0382544e+08]
epoch_result tensor([0.])
train_loss: [4.780008e+08]
epoch_result tensor([0.])
train_loss: [4.8170496e+08]
epoch_result tensor([0.])
train_loss: [4.9221597e+08]
epoch_result tensor([0.])
train_loss: [4.7680704e+08]
epoch_result tensor([0.])
train_loss: [5.0511542e+08]
epoch_result tensor([0.])
train_loss: [4.771694e+08]
epoch_result tensor([0.])
train_loss: [4.908408e+08]
epoch_result tensor([0.])
train_loss: [4.6922378e+08]
epoch_result tensor([0.])
train_loss: [4.9566358e+08]
epoch_result tensor([0.])
train_loss: [4.9555827e+08]
epoch_result tensor([0.])
train_loss: [4.864274e+08]
epoch_result tensor([0.])
train_loss: [4.6648477e+08]
epoch_result tensor([0.])
train_loss: [4.719006e+08]
epoch_result tensor([0.])
train_loss: [4.9165642e+08]
epoch_result tensor([0.])
train_loss: [4.7974573e+08]
epoch_result tensor([0.])
train_loss: [4.680593e+08]
epoch_result tensor([0.])
train_loss: [4.8055568e+08]
epoch_result tensor([0.])
train_loss: [4.677812e+08]
epoch_result tensor([0.])
train_loss: [5.188944e+08]
epoch_result tensor([0.])
train_loss: [4.9198992e+08]
epoch_result tensor([0.])
train_loss: [4.444261e+08]
epoch_result tensor([0.])
train_loss: [4.906883e+08]
epoch_result tensor([0.])
train_loss: [4.7040045e+08]
epoch_result tensor([0.])
train_loss: [4.697956e+08]
epoch_result tensor([0.])
train_loss: [4.9643437e+08]
epoch_result tensor([0.])
train_loss: [4.6591907e+08]
epoch_result tensor([0.])
train_loss: [4.9983146e+08]
epoch_result tensor([0.])
train_loss: [4.782167e+08]
epoch_result tensor([0.])
train_loss: [4.6784163e+08]
epoch_result tensor([0.])
train_loss: [4.9556246e+08]
epoch_result tensor([0.])
train_loss: [4.748582e+08]
epoch_result tensor([0.])
train_loss: [4.8011414e+08]
epoch_result tensor([0.])
train_loss: [4.906535e+08]
epoch_result tensor([0.])
train_loss: [4.738452e+08]
epoch_result tensor([0.])
train_loss: [4.8260592e+08]
Out[138]:
444426100.0
In [139]:
#test the model
# Evaluate the trained 5-layer network on the held-out test set and report RMSE.
# Inference only: torch.no_grad() stops autograd from building a computation
# graph for the forward pass, which saves memory and time.
with torch.no_grad():
    ann_pred2 = model2(torch.tensor(test_x.values).float())
# .detach() is kept so this line also works if ann_pred2 is recomputed elsewhere with grad enabled.
print(mean_squared_error(test_y, ann_pred2.detach().numpy())**0.5) #rmse
147314.16941653125

cf) Tuning model's hyperparameters with K-fold cross validation

In [36]:
# Data for k-fold cross validation: stack the training and validation splits
# row-wise (features and targets separately), since the cross-validation
# procedure draws its own folds from whatever data it is given.
train_x_kf, train_y_kf = (
    pd.concat(split_pair, axis=0)
    for split_pair in ((train_x, valid_x), (train_y, valid_y))
)

Random Forest - K-fold cross validation

In [39]:
# Imported here so the cell does not depend on a later cell having been run first.
from sklearn.ensemble import RandomForestRegressor
from sklearn.model_selection import RandomizedSearchCV

# --- Search space for the randomized hyperparameter search ---

# Number of trees in Random Forest: 200, 400, ..., 1000, plus 1500 and 2000
rf_n_estimators = list(range(200, 1001, 200)) + [1500, 2000]

# Maximum number of levels in tree: 5, 10, ..., 55,
# plus None (the estimator default: no depth limit)
rf_max_depth = list(range(5, 56, 5)) + [None]

# Number of features to consider at every split.
# 1.0 means "all features"; it replaces the 'auto' alias, which meant the same
# thing for regressors but is deprecated/removed in newer scikit-learn releases.
rf_max_features = [1.0, 'sqrt', 'log2']

# The split criterion is not searched; it stays at the estimator default.

# Minimum number of samples required to split a node: 2, 3, ..., 10
rf_min_samples_split = list(range(2, 11))

# Minimum decrease in impurity required for split to happen
rf_min_impurity_decrease = [0.0, 0.05, 0.1]

# Method of selecting samples for training each tree
rf_bootstrap = [True, False]

rf_grid = {'n_estimators': rf_n_estimators,
               'max_depth': rf_max_depth,
               'max_features': rf_max_features,
               'min_samples_split': rf_min_samples_split,
               'min_impurity_decrease': rf_min_impurity_decrease,
               'bootstrap': rf_bootstrap}

# Create the model to be tuned.
# A fixed random_state makes each candidate's fit reproducible; without it the
# search result changes from run to run even though the sampler is seeded.
rf_base = RandomForestRegressor(random_state=0)

# Create the random search Random Forest: 200 sampled candidates x 3 folds.
# Scoring is left at the default, i.e. the estimator's own score (R^2 for regressors).
# NOTE: this is slow -- the recorded run took roughly six hours on 8 workers.
rf_random = RandomizedSearchCV(estimator = rf_base, param_distributions = rf_grid, 
                               n_iter = 200, cv = 3, verbose = 2, random_state = 42, 
                               n_jobs = -1)

# Fit the random search model
rf_random.fit(train_x_kf, train_y_kf)

# View the best parameters from the random search
rf_random.best_params_
Fitting 3 folds for each of 200 candidates, totalling 600 fits
[Parallel(n_jobs=-1)]: Using backend LokyBackend with 8 concurrent workers.
[Parallel(n_jobs=-1)]: Done  25 tasks      | elapsed:  3.6min
[Parallel(n_jobs=-1)]: Done 146 tasks      | elapsed: 15.7min
[Parallel(n_jobs=-1)]: Done 349 tasks      | elapsed: 327.5min
[Parallel(n_jobs=-1)]: Done 600 out of 600 | elapsed: 369.1min finished
Out[39]:
{'n_estimators': 2000,
 'min_samples_split': 8,
 'min_impurity_decrease': 0.1,
 'max_features': 'log2',
 'max_depth': 5,
 'bootstrap': False}
In [40]:
#now try with random forest with "best" parameters
from sklearn.ensemble import RandomForestRegressor
from sklearn.metrics import accuracy_score # accuracy function (a classification metric; not used below)

# Hyperparameters copied from the recorded random-search result
# (rf_random.best_params_): n_estimators=2000, min_samples_split=8,
# min_impurity_decrease=0.1, max_features='log2', max_depth=5, bootstrap=False.
# The previous version of this cell used n_estimators=200 and bootstrap=True,
# which did not match the "best" parameters it claimed to use.
clf_cv = RandomForestRegressor(
    n_estimators=2000,
    max_depth=5,
    min_samples_split=8,
    min_impurity_decrease=0.1,
    max_features='log2',
    bootstrap=False,
    random_state=0,  # fixed seed so the fit is reproducible
)

# NOTE(review): the search was run on train_x_kf (train + validation) while the
# final model is fit on train_x only -- confirm which one is intended.
clf_cv.fit(train_x,train_y)

# Predictions on the held-out test set, scored in the next cell.
predict1 = clf_cv.predict(test_x)
In [41]:
# Test-set error of the tuned random forest: compute the MSE first,
# then print its square root (RMSE).
from sklearn.metrics import mean_squared_error 
rf_cv_mse = mean_squared_error(test_y, predict1)
print(rf_cv_mse**0.5) #rmse
74292.61483889371

4. Ensemble with linear model at the end

https://www.analyticsvidhya.com/blog/2018/06/comprehensive-guide-for-ensemble-models/ (the ensemble idea in this link applies k-fold cross validation to all base models)

- Each base model's predicted y becomes one column of the new train_X for the linear model.

- train_y (the actual y values) becomes the new train_Y for the linear model.

- Since we used 5 regression models, the final linear regression ensemble model has a train_X of 5 columns and a train_y of 1 column.

In [ ]:
from sklearn.linear_model import LinearRegression

# Stacking ("level-1") training set: one column per base model's predictions,
# with the actual training targets as y.
# NOTE(review): this cell has not been executed; the *_pred_y names are assumed
# to hold each base model's predictions for the training rows -- confirm they exist.
new_train_x = pd.concat([rf_pred_y, gbm_pred_y, xgboost_pred_y, ligbm_pred_y, ann_3_pred_y, ann_5_pred_y], axis=1)
new_train_y = train_y

# FIXME(review): the ensemble is trained on base-model predictions, so it must be
# tested on the base models' predictions for test_x (same columns, same order as
# new_train_x). Raw test_x has a different feature layout and cannot be passed
# to ensemble_model.predict as is.
new_test_x = test_x
new_test_y = test_y

# The final combiner is a linear regression (see the notes above this cell).
# scikit-learn has no `LogisticRegressor`, and logistic regression is a
# classifier, so it would not fit a continuous target anyway.
ensemble_model = LinearRegression()

#train ensemble model with new_train_x and new_train_y
#test ensemble model with new_test_x and new_test_y